103b705cfSriastradh/*
203b705cfSriastradh * Copyright (c) 2011 Intel Corporation
303b705cfSriastradh *
403b705cfSriastradh * Permission is hereby granted, free of charge, to any person obtaining a
503b705cfSriastradh * copy of this software and associated documentation files (the "Software"),
603b705cfSriastradh * to deal in the Software without restriction, including without limitation
703b705cfSriastradh * the rights to use, copy, modify, merge, publish, distribute, sublicense,
803b705cfSriastradh * and/or sell copies of the Software, and to permit persons to whom the
903b705cfSriastradh * Software is furnished to do so, subject to the following conditions:
1003b705cfSriastradh *
1103b705cfSriastradh * The above copyright notice and this permission notice (including the next
1203b705cfSriastradh * paragraph) shall be included in all copies or substantial portions of the
1303b705cfSriastradh * Software.
1403b705cfSriastradh *
1503b705cfSriastradh * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
1603b705cfSriastradh * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
1703b705cfSriastradh * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
1803b705cfSriastradh * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
1903b705cfSriastradh * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
2003b705cfSriastradh * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
2103b705cfSriastradh * SOFTWARE.
2203b705cfSriastradh *
2303b705cfSriastradh * Authors:
2403b705cfSriastradh *    Chris Wilson <chris@chris-wilson.co.uk>
2503b705cfSriastradh *
2603b705cfSriastradh */
2703b705cfSriastradh
2803b705cfSriastradh#ifdef HAVE_CONFIG_H
2903b705cfSriastradh#include "config.h"
3003b705cfSriastradh#endif
3103b705cfSriastradh
3203b705cfSriastradh#include "sna.h"
3303b705cfSriastradh#include "sna_reg.h"
3403b705cfSriastradh
3503b705cfSriastradh#include <unistd.h>
3603b705cfSriastradh#include <sys/ioctl.h>
3703b705cfSriastradh#include <sys/mman.h>
389a906b70Schristos#include <sys/stat.h>
3903b705cfSriastradh#include <time.h>
409a906b70Schristos#include <sched.h>
4103b705cfSriastradh#include <errno.h>
4203b705cfSriastradh#include <fcntl.h>
4303b705cfSriastradh
4403b705cfSriastradh#include <xf86drm.h>
4503b705cfSriastradh
4603b705cfSriastradh#ifdef HAVE_VALGRIND
4703b705cfSriastradh#include <valgrind.h>
4803b705cfSriastradh#include <memcheck.h>
4903b705cfSriastradh#endif
5003b705cfSriastradh
5103b705cfSriastradh#ifdef HAVE_STRUCT_SYSINFO_TOTALRAM
5203b705cfSriastradh#include <sys/sysinfo.h>
5303b705cfSriastradh#endif
5403b705cfSriastradh
5503b705cfSriastradh#include "sna_cpuid.h"
5603b705cfSriastradh
5703b705cfSriastradhstatic struct kgem_bo *
5803b705cfSriastradhsearch_linear_cache(struct kgem *kgem, unsigned int num_pages, unsigned flags);
5903b705cfSriastradh
6003b705cfSriastradhstatic struct kgem_bo *
6103b705cfSriastradhsearch_snoop_cache(struct kgem *kgem, unsigned int num_pages, unsigned flags);
6203b705cfSriastradh
6303b705cfSriastradh#define DBG_NO_HW 0
649a906b70Schristos#define DBG_NO_EXEC 0
6503b705cfSriastradh#define DBG_NO_TILING 0
6603b705cfSriastradh#define DBG_NO_CACHE 0
679a906b70Schristos#define DBG_NO_SNOOP_CACHE 0
6803b705cfSriastradh#define DBG_NO_CACHE_LEVEL 0
6903b705cfSriastradh#define DBG_NO_CPU 0
7003b705cfSriastradh#define DBG_NO_CREATE2 0
7103b705cfSriastradh#define DBG_NO_USERPTR 0
7203b705cfSriastradh#define DBG_NO_UNSYNCHRONIZED_USERPTR 0
7363ef14f0Smrg#define DBG_NO_COHERENT_MMAP_GTT 0
7403b705cfSriastradh#define DBG_NO_LLC 0
7503b705cfSriastradh#define DBG_NO_SEMAPHORES 0
7603b705cfSriastradh#define DBG_NO_MADV 0
7703b705cfSriastradh#define DBG_NO_UPLOAD_CACHE 0
7803b705cfSriastradh#define DBG_NO_UPLOAD_ACTIVE 0
7903b705cfSriastradh#define DBG_NO_MAP_UPLOAD 0
8003b705cfSriastradh#define DBG_NO_RELAXED_FENCING 0
8103b705cfSriastradh#define DBG_NO_SECURE_BATCHES 0
8203b705cfSriastradh#define DBG_NO_PINNED_BATCHES 0
83813957e3Ssnj#define DBG_NO_SHRINK_BATCHES 0
8403b705cfSriastradh#define DBG_NO_FAST_RELOC 0
8503b705cfSriastradh#define DBG_NO_HANDLE_LUT 0
8603b705cfSriastradh#define DBG_NO_WT 0
87813957e3Ssnj#define DBG_NO_WC_MMAP 0
8863ef14f0Smrg#define DBG_NO_BLT_Y 0
8963ef14f0Smrg#define DBG_NO_SCANOUT_Y 0
9063ef14f0Smrg#define DBG_NO_DIRTYFB 0
9163ef14f0Smrg#define DBG_NO_DETILING 0
9203b705cfSriastradh#define DBG_DUMP 0
939a906b70Schristos#define DBG_NO_MALLOC_CACHE 0
9403b705cfSriastradh
9503b705cfSriastradh#define FORCE_MMAP_SYNC 0 /* ((1 << DOMAIN_CPU) | (1 << DOMAIN_GTT)) */
9603b705cfSriastradh
9703b705cfSriastradh#ifndef DEBUG_SYNC
9803b705cfSriastradh#define DEBUG_SYNC 0
9903b705cfSriastradh#endif
10003b705cfSriastradh
1019a906b70Schristos#define SHOW_BATCH_BEFORE 0
1029a906b70Schristos#define SHOW_BATCH_AFTER 0
10303b705cfSriastradh
10403b705cfSriastradh#if 0
10503b705cfSriastradh#define ASSERT_IDLE(kgem__, handle__) assert(!__kgem_busy(kgem__, handle__))
10603b705cfSriastradh#define ASSERT_MAYBE_IDLE(kgem__, handle__, expect__) assert(!(expect__) || !__kgem_busy(kgem__, handle__))
10703b705cfSriastradh#else
10803b705cfSriastradh#define ASSERT_IDLE(kgem__, handle__)
10903b705cfSriastradh#define ASSERT_MAYBE_IDLE(kgem__, handle__, expect__)
11003b705cfSriastradh#endif
11103b705cfSriastradh
/* Worst case seems to be 965gm where we cannot write within a cacheline that
 * is simultaneously being read by the GPU, or within the sampler
 * prefetch. In general, the chipsets seem to have a requirement that sampler
 * offsets be aligned to a cacheline (64 bytes).
 *
 * Actually, it turns out the BLT color pattern (BR15) has the most severe
 * alignment restrictions, 64 bytes for 8-bpp, 128 bytes for 16-bpp and 256
 * bytes for 32-bpp.
 */
1219a906b70Schristos#define UPLOAD_ALIGNMENT 256
12203b705cfSriastradh
12303b705cfSriastradh#define PAGE_ALIGN(x) ALIGN(x, PAGE_SIZE)
12403b705cfSriastradh#define NUM_PAGES(x) (((x) + PAGE_SIZE-1) / PAGE_SIZE)
12503b705cfSriastradh
12603b705cfSriastradh#define MAX_GTT_VMA_CACHE 512
12703b705cfSriastradh#define MAX_CPU_VMA_CACHE INT16_MAX
12803b705cfSriastradh#define MAP_PRESERVE_TIME 10
12903b705cfSriastradh
1309a906b70Schristos#define MAKE_USER_MAP(ptr) ((void*)((uintptr_t)(ptr) | 1))
1319a906b70Schristos#define IS_USER_MAP(ptr) ((uintptr_t)(ptr) & 1)
13203b705cfSriastradh
13303b705cfSriastradh#define LOCAL_I915_PARAM_HAS_BLT		11
13403b705cfSriastradh#define LOCAL_I915_PARAM_HAS_RELAXED_FENCING	12
13503b705cfSriastradh#define LOCAL_I915_PARAM_HAS_RELAXED_DELTA	15
136813957e3Ssnj#define LOCAL_I915_PARAM_HAS_LLC		17
13703b705cfSriastradh#define LOCAL_I915_PARAM_HAS_SEMAPHORES		20
13803b705cfSriastradh#define LOCAL_I915_PARAM_HAS_SECURE_BATCHES	23
13903b705cfSriastradh#define LOCAL_I915_PARAM_HAS_PINNED_BATCHES	24
14003b705cfSriastradh#define LOCAL_I915_PARAM_HAS_NO_RELOC		25
14103b705cfSriastradh#define LOCAL_I915_PARAM_HAS_HANDLE_LUT		26
14203b705cfSriastradh#define LOCAL_I915_PARAM_HAS_WT			27
143813957e3Ssnj#define LOCAL_I915_PARAM_MMAP_VERSION		30
14463ef14f0Smrg#define LOCAL_I915_PARAM_MMAP_GTT_COHERENT	52
14503b705cfSriastradh
14603b705cfSriastradh#define LOCAL_I915_EXEC_IS_PINNED		(1<<10)
14703b705cfSriastradh#define LOCAL_I915_EXEC_NO_RELOC		(1<<11)
14803b705cfSriastradh#define LOCAL_I915_EXEC_HANDLE_LUT		(1<<12)
14903b705cfSriastradh
/* Local definition of the i915 GEM_CREATE2 ioctl: command number, request
 * code and the argument structure passed to it.
 */
#define LOCAL_I915_GEM_CREATE2       0x34
#define LOCAL_IOCTL_I915_GEM_CREATE2 DRM_IOWR (DRM_COMMAND_BASE + LOCAL_I915_GEM_CREATE2, struct local_i915_gem_create2)

/* Values for local_i915_gem_create2.placement */
#define LOCAL_I915_CREATE_PLACEMENT_SYSTEM 0
#define LOCAL_I915_CREATE_PLACEMENT_STOLEN 1 /* Cannot use CPU mmaps or pread/pwrite */

struct local_i915_gem_create2 {
	uint64_t size;
	uint32_t placement;	/* LOCAL_I915_CREATE_PLACEMENT_* */
	uint32_t domain;
	uint32_t caching;
	uint32_t tiling_mode;
	uint32_t stride;
	uint32_t flags;
	uint32_t pad;
	uint32_t handle;
};
16503b705cfSriastradh
/* Local definition of the i915 GEM_USERPTR ioctl: command number, request
 * code, flag bits and the argument structure passed to it.
 */
#define LOCAL_I915_GEM_USERPTR       0x33
#define LOCAL_IOCTL_I915_GEM_USERPTR DRM_IOWR (DRM_COMMAND_BASE + LOCAL_I915_GEM_USERPTR, struct local_i915_gem_userptr)

/* Bits for local_i915_gem_userptr.flags */
#define I915_USERPTR_READ_ONLY		0x1
#define I915_USERPTR_UNSYNCHRONIZED	0x80000000

struct local_i915_gem_userptr {
	uint64_t user_ptr;	/* address of the user memory */
	uint64_t user_size;	/* length of the user memory */
	uint32_t flags;		/* I915_USERPTR_* */
	uint32_t handle;	/* read back by gem_userptr() after the ioctl */
};
17603b705cfSriastradh
17703b705cfSriastradh#define UNCACHED	0
17803b705cfSriastradh#define SNOOPED		1
17903b705cfSriastradh#define DISPLAY		2
18003b705cfSriastradh
/* Argument shared by the SET_CACHING and GET_CACHING ioctls: `caching` holds
 * the caching level (e.g. UNCACHED or SNOOPED) of the object `handle`.
 */
struct local_i915_gem_caching {
	uint32_t handle;
	uint32_t caching;
};

#define LOCAL_I915_GEM_SET_CACHING	0x2f
#define LOCAL_I915_GEM_GET_CACHING	0x30
#define LOCAL_IOCTL_I915_GEM_SET_CACHING DRM_IOW(DRM_COMMAND_BASE + LOCAL_I915_GEM_SET_CACHING, struct local_i915_gem_caching)
/* GET_CACHING returns the level through the argument, so the request must be
 * encoded read/write (DRM_IOWR, as in the kernel's i915_drm.h); with a
 * write-only encoding the result is not guaranteed to be copied back.
 */
#define LOCAL_IOCTL_I915_GEM_GET_CACHING DRM_IOWR(DRM_COMMAND_BASE + LOCAL_I915_GEM_GET_CACHING, struct local_i915_gem_caching)
19003b705cfSriastradh
/* Local copy of the argument for the GEM_MMAP ioctl (the variant without a
 * flags field); addr_ptr is read back by the caller after the ioctl.
 */
struct local_i915_gem_mmap {
	uint32_t handle;	/* object to map */
	uint32_t pad;
	uint64_t offset;	/* offset into the object */
	uint64_t size;		/* length of the mapping */
	uint64_t addr_ptr;	/* resulting address */
};

#define LOCAL_IOCTL_I915_GEM_MMAP DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_MMAP, struct local_i915_gem_mmap)
19963ef14f0Smrg
/* Bit for local_i915_gem_mmap2.flags (used for the CPU(wc) mapping) */
#define I915_MMAP_WC 0x1

/* Local copy of the extended GEM_MMAP argument: the same layout as
 * local_i915_gem_mmap followed by a flags word.
 */
struct local_i915_gem_mmap2 {
	uint32_t handle;	/* object to map */
	uint32_t pad;
	uint64_t offset;	/* offset into the object */
	uint64_t size;		/* length of the mapping */
	uint64_t addr_ptr;	/* resulting address */
	uint64_t flags;		/* I915_MMAP_* */
};

#define LOCAL_IOCTL_I915_GEM_MMAP_v2 DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_MMAP, struct local_i915_gem_mmap2)
210813957e3Ssnj
21103b705cfSriastradhstruct kgem_buffer {
21203b705cfSriastradh	struct kgem_bo base;
21303b705cfSriastradh	void *mem;
21403b705cfSriastradh	uint32_t used;
21503b705cfSriastradh	uint32_t need_io : 1;
21603b705cfSriastradh	uint32_t write : 2;
2179a906b70Schristos	uint32_t mmapped : 2;
2189a906b70Schristos};
2199a906b70Schristosenum {
2209a906b70Schristos	MMAPPED_NONE,
2219a906b70Schristos	MMAPPED_GTT,
2229a906b70Schristos	MMAPPED_CPU
22303b705cfSriastradh};
22403b705cfSriastradh
22503b705cfSriastradhstatic struct kgem_bo *__kgem_freed_bo;
22603b705cfSriastradhstatic struct kgem_request *__kgem_freed_request;
22703b705cfSriastradhstatic struct drm_i915_gem_exec_object2 _kgem_dummy_exec;
22803b705cfSriastradh
22963ef14f0Smrgstatic inline struct sna *__to_sna(struct kgem *kgem)
23063ef14f0Smrg{
23163ef14f0Smrg	/* minor layering violations */
23263ef14f0Smrg	return container_of(kgem, struct sna, kgem);
23363ef14f0Smrg}
23463ef14f0Smrg
/* Size of the bo as reported by __kgem_bo_size(), returned as an int. */
static inline int bytes(struct kgem_bo *bo)
{
	const int size = __kgem_bo_size(bo);

	return size;
}
23903b705cfSriastradh
24003b705cfSriastradh#define bucket(B) (B)->size.pages.bucket
24103b705cfSriastradh#define num_pages(B) (B)->size.pages.count
24203b705cfSriastradh
/* Slow path of do_ioctl(), entered after an ioctl() has already failed.
 *
 * Looks at errno from the failed call: EINTR retries immediately, EAGAIN
 * yields the CPU and then retries, anything else is returned negated.
 * Returns 0 as soon as a retry succeeds.
 */
static int __do_ioctl(int fd, unsigned long req, void *arg)
{
	for (;;) {
		/* snapshot errno before any other call can overwrite it */
		const int err = errno;

		if (err == EAGAIN)
			sched_yield();
		else if (err != EINTR)
			return -err;

		if (likely(ioctl(fd, req, arg) == 0))
			return 0;
	}
}
2619a906b70Schristos
/* Issue an ioctl, returning 0 on success; on failure the retry and error
 * handling is delegated to __do_ioctl(), whose result is returned.
 */
inline static int do_ioctl(int fd, unsigned long req, void *arg)
{
	/* fast path: the first attempt usually succeeds */
	if (!likely(ioctl(fd, req, arg) == 0))
		return __do_ioctl(fd, req, arg);

	return 0;
}
2699a906b70Schristos
#ifdef DEBUG_MEMORY
/* Account one more allocation of `size` bytes in kgem->debug_memory. */
static void debug_alloc(struct kgem *kgem, size_t size)
{
	kgem->debug_memory.bo_bytes += size;
	kgem->debug_memory.bo_allocs++;
}

/* Account the allocation of a bo, using its size in bytes. */
static void debug_alloc__bo(struct kgem *kgem, struct kgem_bo *bo)
{
	debug_alloc(kgem, bytes(bo));
}
#else
/* Without DEBUG_MEMORY the accounting compiles away. */
#define debug_alloc__bo(k, b)
#endif
28303b705cfSriastradh
28403b705cfSriastradh#ifndef NDEBUG
28503b705cfSriastradhstatic void assert_tiling(struct kgem *kgem, struct kgem_bo *bo)
28603b705cfSriastradh{
28703b705cfSriastradh	struct drm_i915_gem_get_tiling tiling;
28803b705cfSriastradh
28903b705cfSriastradh	assert(bo);
29003b705cfSriastradh
29163ef14f0Smrg	if (!kgem->can_fence && kgem->gen >= 040 && bo->tiling)
29263ef14f0Smrg		return; /* lies */
29363ef14f0Smrg
29403b705cfSriastradh	VG_CLEAR(tiling);
29503b705cfSriastradh	tiling.handle = bo->handle;
2969a906b70Schristos	tiling.tiling_mode = bo->tiling;
2979a906b70Schristos	(void)do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_GET_TILING, &tiling);
29803b705cfSriastradh	assert(tiling.tiling_mode == bo->tiling);
29903b705cfSriastradh}
3009a906b70Schristos
30163ef14f0Smrgstatic void assert_caching(struct kgem *kgem, struct kgem_bo *bo)
3029a906b70Schristos{
3039a906b70Schristos	struct local_i915_gem_caching arg;
3049a906b70Schristos	int expect = kgem->has_llc ? SNOOPED : UNCACHED;
3059a906b70Schristos
3069a906b70Schristos	VG_CLEAR(arg);
3079a906b70Schristos	arg.handle = bo->handle;
3089a906b70Schristos	arg.caching = expect;
3099a906b70Schristos
3109a906b70Schristos	(void)do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_GET_CACHING, &arg);
3119a906b70Schristos
3129a906b70Schristos	assert(arg.caching == expect);
3139a906b70Schristos}
3149a906b70Schristos
3159a906b70Schristosstatic void assert_bo_retired(struct kgem_bo *bo)
3169a906b70Schristos{
3179a906b70Schristos	DBG(("%s: handle=%d, domain: %d exec? %d, rq? %d\n", __FUNCTION__,
3189a906b70Schristos	     bo->handle, bo->domain, bo->exec != NULL, bo->rq != NULL));
3199a906b70Schristos	assert(bo->refcnt);
3209a906b70Schristos	assert(bo->rq == NULL);
3219a906b70Schristos	assert(bo->exec == NULL);
32263ef14f0Smrg	assert(!bo->needs_flush);
3239a906b70Schristos	assert(list_is_empty(&bo->request));
3249a906b70Schristos}
32503b705cfSriastradh#else
32603b705cfSriastradh#define assert_tiling(kgem, bo)
32763ef14f0Smrg#define assert_caching(kgem, bo)
3289a906b70Schristos#define assert_bo_retired(bo)
32903b705cfSriastradh#endif
33003b705cfSriastradh
33163ef14f0Smrgstatic int __find_debugfs(struct kgem *kgem)
33263ef14f0Smrg{
33363ef14f0Smrg	int i;
33463ef14f0Smrg
33563ef14f0Smrg	for (i = 0; i < DRM_MAX_MINOR; i++) {
33663ef14f0Smrg		char path[80];
33763ef14f0Smrg
33863ef14f0Smrg		sprintf(path, "/sys/kernel/debug/dri/%d/i915_wedged", i);
33963ef14f0Smrg		if (access(path, R_OK) == 0)
34063ef14f0Smrg			return i;
34163ef14f0Smrg
34263ef14f0Smrg		sprintf(path, "/debug/dri/%d/i915_wedged", i);
34363ef14f0Smrg		if (access(path, R_OK) == 0)
34463ef14f0Smrg			return i;
34563ef14f0Smrg	}
34663ef14f0Smrg
34763ef14f0Smrg	return -1;
34863ef14f0Smrg}
34963ef14f0Smrg
35063ef14f0Smrgstatic int kgem_get_minor(struct kgem *kgem)
35163ef14f0Smrg{
35263ef14f0Smrg	struct stat st;
35363ef14f0Smrg
35463ef14f0Smrg	if (fstat(kgem->fd, &st))
35563ef14f0Smrg		return __find_debugfs(kgem);
35663ef14f0Smrg
35763ef14f0Smrg	if (!S_ISCHR(st.st_mode))
35863ef14f0Smrg		return __find_debugfs(kgem);
35963ef14f0Smrg
36063ef14f0Smrg	return st.st_rdev & 0x63;
36163ef14f0Smrg}
36263ef14f0Smrg
/* Locate a readable error-state file for our device.
 *
 * On success the path is left in `path` (at most maxlen bytes) and true is
 * returned; otherwise `path` is set to the empty string and false is
 * returned.
 */
static bool find_hang_state(struct kgem *kgem, char *path, int maxlen)
{
	const int minor = kgem_get_minor(kgem);
	bool found;

	/* Search for our hang state in a few canonical locations.
	 * In the unlikely event of having multiple devices, we
	 * will need to check which minor actually corresponds to ours.
	 */

	snprintf(path, maxlen, "/sys/class/drm/card%d/error", minor);
	found = access(path, R_OK) == 0;

	if (!found) {
		snprintf(path, maxlen, "/sys/kernel/debug/dri/%d/i915_error_state", minor);
		found = access(path, R_OK) == 0;
	}

	if (!found) {
		snprintf(path, maxlen, "/debug/dri/%d/i915_error_state", minor);
		found = access(path, R_OK) == 0;
	}

	if (!found)
		path[0] = '\0';

	return found;
}
38763ef14f0Smrg
/* Report whether the file at `path` holds an error state.
 *
 * Returns true only if the file can be opened, one byte can be read from it
 * and that byte is not 'N'. The kgem argument is not used.
 */
static bool has_error_state(struct kgem *kgem, char *path)
{
	bool present = false;
	char first;
	int fd;

	fd = open(path, O_RDONLY);
	if (fd < 0)
		return false;

	/* only the first character is inspected */
	if (read(fd, &first, 1) == 1)
		present = first != 'N';

	close(fd);
	return present;
}
40263ef14f0Smrg
40363ef14f0Smrgstatic int kgem_get_screen_index(struct kgem *kgem)
40463ef14f0Smrg{
40563ef14f0Smrg	return __to_sna(kgem)->scrn->scrnIndex;
40663ef14f0Smrg}
40763ef14f0Smrg
408813957e3Ssnjstatic void
409813957e3Ssnj__kgem_set_wedged(struct kgem *kgem)
410813957e3Ssnj{
41163ef14f0Smrg	static int once;
41263ef14f0Smrg	char path[256];
41363ef14f0Smrg
41463ef14f0Smrg	if (kgem->wedged)
41563ef14f0Smrg		return;
41663ef14f0Smrg
41763ef14f0Smrg	if (!once &&
41863ef14f0Smrg	    find_hang_state(kgem, path, sizeof(path)) &&
41963ef14f0Smrg            has_error_state(kgem, path)) {
42063ef14f0Smrg		xf86DrvMsg(kgem_get_screen_index(kgem), X_ERROR,
42163ef14f0Smrg			   "When reporting this, please include %s and the full dmesg.\n",
42263ef14f0Smrg			   path);
42363ef14f0Smrg		once = 1;
42463ef14f0Smrg	}
42563ef14f0Smrg
426813957e3Ssnj	kgem->wedged = true;
42763ef14f0Smrg	sna_render_mark_wedged(__to_sna(kgem));
428813957e3Ssnj}
429813957e3Ssnj
43003b705cfSriastradhstatic void kgem_sna_reset(struct kgem *kgem)
43103b705cfSriastradh{
43263ef14f0Smrg	struct sna *sna = __to_sna(kgem);
43303b705cfSriastradh
43403b705cfSriastradh	sna->render.reset(sna);
43503b705cfSriastradh	sna->blt_state.fill_bo = 0;
43603b705cfSriastradh}
43703b705cfSriastradh
43803b705cfSriastradhstatic void kgem_sna_flush(struct kgem *kgem)
43903b705cfSriastradh{
44063ef14f0Smrg	struct sna *sna = __to_sna(kgem);
44103b705cfSriastradh
44203b705cfSriastradh	sna->render.flush(sna);
44303b705cfSriastradh
44403b705cfSriastradh	if (sna->render.solid_cache.dirty)
44503b705cfSriastradh		sna_render_flush_solid(sna);
44603b705cfSriastradh}
44703b705cfSriastradh
44863ef14f0Smrgstatic bool kgem_bo_rmfb(struct kgem *kgem, struct kgem_bo *bo)
44963ef14f0Smrg{
45063ef14f0Smrg	if (bo->scanout && bo->delta) {
45163ef14f0Smrg		DBG(("%s: releasing fb=%d for handle=%d\n",
45263ef14f0Smrg		     __FUNCTION__, bo->delta, bo->handle));
45363ef14f0Smrg		/* XXX will leak if we are not DRM_MASTER. *shrug* */
45463ef14f0Smrg		do_ioctl(kgem->fd, DRM_IOCTL_MODE_RMFB, &bo->delta);
45563ef14f0Smrg		bo->delta = 0;
45663ef14f0Smrg		return true;
45763ef14f0Smrg	} else
45863ef14f0Smrg		return false;
45963ef14f0Smrg}
46063ef14f0Smrg
46163ef14f0Smrgstatic bool kgem_set_tiling(struct kgem *kgem, struct kgem_bo *bo,
46263ef14f0Smrg			    int tiling, int stride)
46303b705cfSriastradh{
46403b705cfSriastradh	struct drm_i915_gem_set_tiling set_tiling;
4659a906b70Schristos	int err;
46603b705cfSriastradh
46763ef14f0Smrg	if (tiling == bo->tiling) {
46863ef14f0Smrg		if (tiling == I915_TILING_NONE) {
46963ef14f0Smrg			bo->pitch = stride;
47063ef14f0Smrg			return true;
47163ef14f0Smrg		}
47263ef14f0Smrg		if (stride == bo->pitch)
47363ef14f0Smrg			return true;
47463ef14f0Smrg	}
47563ef14f0Smrg
47603b705cfSriastradh	if (DBG_NO_TILING)
47703b705cfSriastradh		return false;
47803b705cfSriastradh
47903b705cfSriastradh	VG_CLEAR(set_tiling);
4809a906b70Schristosrestart:
48163ef14f0Smrg	set_tiling.handle = bo->handle;
4829a906b70Schristos	set_tiling.tiling_mode = tiling;
48363ef14f0Smrg	set_tiling.stride = tiling ? stride : 0;
48403b705cfSriastradh
48563ef14f0Smrg	if (ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_TILING, &set_tiling) == 0) {
48663ef14f0Smrg		bo->tiling = set_tiling.tiling_mode;
48763ef14f0Smrg		bo->pitch = set_tiling.tiling_mode ? set_tiling.stride : stride;
48863ef14f0Smrg		DBG(("%s: handle=%d, tiling=%d [%d], pitch=%d [%d]: %d\n",
48963ef14f0Smrg		     __FUNCTION__, bo->handle,
49063ef14f0Smrg		     bo->tiling, tiling,
49163ef14f0Smrg		     bo->pitch, stride,
49263ef14f0Smrg		     set_tiling.tiling_mode == tiling));
49363ef14f0Smrg		return set_tiling.tiling_mode == tiling && bo->pitch >= stride;
49463ef14f0Smrg	}
4959a906b70Schristos
4969a906b70Schristos	err = errno;
4979a906b70Schristos	if (err == EINTR)
4989a906b70Schristos		goto restart;
4999a906b70Schristos
5009a906b70Schristos	if (err == EAGAIN) {
5019a906b70Schristos		sched_yield();
5029a906b70Schristos		goto restart;
5039a906b70Schristos	}
5049a906b70Schristos
50563ef14f0Smrg	if (err == EBUSY && kgem_bo_rmfb(kgem, bo))
50663ef14f0Smrg		goto restart;
50763ef14f0Smrg
50863ef14f0Smrg	ERR(("%s: failed to set-tiling(tiling=%d, pitch=%d) for handle=%d: %d\n",
50963ef14f0Smrg	     __FUNCTION__, tiling, stride, bo->handle, err));
5109a906b70Schristos	return false;
51103b705cfSriastradh}
51203b705cfSriastradh
51303b705cfSriastradhstatic bool gem_set_caching(int fd, uint32_t handle, int caching)
51403b705cfSriastradh{
51503b705cfSriastradh	struct local_i915_gem_caching arg;
51603b705cfSriastradh
51703b705cfSriastradh	VG_CLEAR(arg);
51803b705cfSriastradh	arg.handle = handle;
51903b705cfSriastradh	arg.caching = caching;
5209a906b70Schristos	return do_ioctl(fd, LOCAL_IOCTL_I915_GEM_SET_CACHING, &arg) == 0;
52103b705cfSriastradh}
52203b705cfSriastradh
52303b705cfSriastradhstatic uint32_t gem_userptr(int fd, void *ptr, int size, int read_only)
52403b705cfSriastradh{
52503b705cfSriastradh	struct local_i915_gem_userptr arg;
52603b705cfSriastradh
52703b705cfSriastradh	VG_CLEAR(arg);
52803b705cfSriastradh	arg.user_ptr = (uintptr_t)ptr;
52903b705cfSriastradh	arg.user_size = size;
53003b705cfSriastradh	arg.flags = I915_USERPTR_UNSYNCHRONIZED;
53103b705cfSriastradh	if (read_only)
53203b705cfSriastradh		arg.flags |= I915_USERPTR_READ_ONLY;
53303b705cfSriastradh
53403b705cfSriastradh	if (DBG_NO_UNSYNCHRONIZED_USERPTR ||
5359a906b70Schristos	    do_ioctl(fd, LOCAL_IOCTL_I915_GEM_USERPTR, &arg)) {
53603b705cfSriastradh		arg.flags &= ~I915_USERPTR_UNSYNCHRONIZED;
5379a906b70Schristos		if (do_ioctl(fd, LOCAL_IOCTL_I915_GEM_USERPTR, &arg)) {
53803b705cfSriastradh			DBG(("%s: failed to map %p + %d bytes: %d\n",
53903b705cfSriastradh			     __FUNCTION__, ptr, size, errno));
54003b705cfSriastradh			return 0;
54103b705cfSriastradh		}
54203b705cfSriastradh	}
54303b705cfSriastradh
54403b705cfSriastradh	return arg.handle;
54503b705cfSriastradh}
54603b705cfSriastradh
5479a906b70Schristosstatic bool __kgem_throttle(struct kgem *kgem, bool harder)
54803b705cfSriastradh{
5499a906b70Schristos	/* Let this be woken up by sigtimer so that we don't block here
5509a906b70Schristos	 * too much and completely starve X. We will sleep again shortly,
5519a906b70Schristos	 * and so catch up or detect the hang.
5529a906b70Schristos	 */
5539a906b70Schristos	do {
5549a906b70Schristos		if (ioctl(kgem->fd, DRM_IOCTL_I915_GEM_THROTTLE) == 0) {
5559a906b70Schristos			kgem->need_throttle = 0;
5569a906b70Schristos			return false;
5579a906b70Schristos		}
55803b705cfSriastradh
5599a906b70Schristos		if (errno == EIO)
5609a906b70Schristos			return true;
5619a906b70Schristos	} while (harder);
5629a906b70Schristos
5639a906b70Schristos	return false;
5649a906b70Schristos}
5659a906b70Schristos
5669a906b70Schristosstatic bool __kgem_throttle_retire(struct kgem *kgem, unsigned flags)
5679a906b70Schristos{
5689a906b70Schristos	if (flags & CREATE_NO_RETIRE || !kgem->need_retire) {
5699a906b70Schristos		DBG(("%s: not retiring\n", __FUNCTION__));
57003b705cfSriastradh		return false;
57103b705cfSriastradh	}
57203b705cfSriastradh
57303b705cfSriastradh	if (kgem_retire(kgem))
57403b705cfSriastradh		return true;
57503b705cfSriastradh
57603b705cfSriastradh	if (flags & CREATE_NO_THROTTLE || !kgem->need_throttle) {
57703b705cfSriastradh		DBG(("%s: not throttling\n", __FUNCTION__));
57803b705cfSriastradh		return false;
57903b705cfSriastradh	}
58003b705cfSriastradh
5819a906b70Schristos	__kgem_throttle(kgem, false);
58203b705cfSriastradh	return kgem_retire(kgem);
58303b705cfSriastradh}
58403b705cfSriastradh
58503b705cfSriastradhstatic void *__kgem_bo_map__gtt(struct kgem *kgem, struct kgem_bo *bo)
58603b705cfSriastradh{
587813957e3Ssnj	struct drm_i915_gem_mmap_gtt gtt;
58803b705cfSriastradh	void *ptr;
5893d02bce8Sriastradh	int err;
59003b705cfSriastradh
59103b705cfSriastradh	DBG(("%s(handle=%d, size=%d)\n", __FUNCTION__,
59203b705cfSriastradh	     bo->handle, bytes(bo)));
59303b705cfSriastradh
59463ef14f0Smrg	if (bo->tiling && !kgem->can_fence)
59563ef14f0Smrg		return NULL;
59663ef14f0Smrg
597813957e3Ssnj	VG_CLEAR(gtt);
59803b705cfSriastradhretry_gtt:
599813957e3Ssnj	gtt.handle = bo->handle;
600813957e3Ssnj	if ((err = do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_MMAP_GTT, &gtt))) {
60163ef14f0Smrg		DBG(("%s: failed %d, throttling/cleaning caches\n",
60263ef14f0Smrg		     __FUNCTION__, err));
60303b705cfSriastradh		assert(err != EINVAL);
60403b705cfSriastradh
60503b705cfSriastradh		(void)__kgem_throttle_retire(kgem, 0);
60603b705cfSriastradh		if (kgem_expire_cache(kgem))
60703b705cfSriastradh			goto retry_gtt;
60803b705cfSriastradh
6099a906b70Schristos		if (kgem_cleanup_cache(kgem))
61003b705cfSriastradh			goto retry_gtt;
61103b705cfSriastradh
6129a906b70Schristos		ERR(("%s: failed to retrieve GTT offset for handle=%d: %d\n",
6139a906b70Schristos		     __FUNCTION__, bo->handle, -err));
61403b705cfSriastradh		return NULL;
61503b705cfSriastradh	}
61603b705cfSriastradh
61703b705cfSriastradhretry_mmap:
6189a906b70Schristos	ptr = mmap(0, bytes(bo), PROT_READ | PROT_WRITE, MAP_SHARED,
619813957e3Ssnj		   kgem->fd, gtt.offset);
6209a906b70Schristos	if (ptr == MAP_FAILED) {
6219a906b70Schristos		err = errno;
62263ef14f0Smrg		DBG(("%s: failed %d, throttling/cleaning caches\n",
62363ef14f0Smrg		     __FUNCTION__, err));
62403b705cfSriastradh		assert(err != EINVAL);
62503b705cfSriastradh
62603b705cfSriastradh		if (__kgem_throttle_retire(kgem, 0))
62703b705cfSriastradh			goto retry_mmap;
62803b705cfSriastradh
6299a906b70Schristos		if (kgem_cleanup_cache(kgem))
63003b705cfSriastradh			goto retry_mmap;
63103b705cfSriastradh
6329a906b70Schristos		ERR(("%s: failed to mmap handle=%d, %d bytes, into GTT domain: %d\n",
6339a906b70Schristos		     __FUNCTION__, bo->handle, bytes(bo), err));
63403b705cfSriastradh		ptr = NULL;
63503b705cfSriastradh	}
63603b705cfSriastradh
637813957e3Ssnj	/* Cache this mapping to avoid the overhead of an
638813957e3Ssnj	 * excruciatingly slow GTT pagefault. This is more an
639813957e3Ssnj	 * issue with compositing managers which need to
640813957e3Ssnj	 * frequently flush CPU damage to their GPU bo.
641813957e3Ssnj	 */
642813957e3Ssnj	return bo->map__gtt = ptr;
643813957e3Ssnj}
644813957e3Ssnj
645813957e3Ssnjstatic void *__kgem_bo_map__wc(struct kgem *kgem, struct kgem_bo *bo)
646813957e3Ssnj{
647813957e3Ssnj	struct local_i915_gem_mmap2 wc;
648813957e3Ssnj	int err;
649813957e3Ssnj
650813957e3Ssnj	DBG(("%s(handle=%d, size=%d)\n", __FUNCTION__,
651813957e3Ssnj	     bo->handle, bytes(bo)));
652813957e3Ssnj	assert(kgem->has_wc_mmap);
653813957e3Ssnj
654813957e3Ssnj	VG_CLEAR(wc);
655813957e3Ssnj
656813957e3Ssnjretry_wc:
657813957e3Ssnj	wc.handle = bo->handle;
658813957e3Ssnj	wc.offset = 0;
659813957e3Ssnj	wc.size = bytes(bo);
660813957e3Ssnj	wc.flags = I915_MMAP_WC;
661813957e3Ssnj	if ((err = do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_MMAP_v2, &wc))) {
66263ef14f0Smrg		DBG(("%s: failed %d, throttling/cleaning caches\n",
66363ef14f0Smrg		     __FUNCTION__, err));
664813957e3Ssnj		assert(err != EINVAL);
665813957e3Ssnj
666813957e3Ssnj		if (__kgem_throttle_retire(kgem, 0))
667813957e3Ssnj			goto retry_wc;
668813957e3Ssnj
669813957e3Ssnj		if (kgem_cleanup_cache(kgem))
670813957e3Ssnj			goto retry_wc;
671813957e3Ssnj
672813957e3Ssnj		ERR(("%s: failed to mmap handle=%d, %d bytes, into CPU(wc) domain: %d\n",
673813957e3Ssnj		     __FUNCTION__, bo->handle, bytes(bo), -err));
674813957e3Ssnj		return NULL;
675813957e3Ssnj	}
676813957e3Ssnj
677813957e3Ssnj	VG(VALGRIND_MAKE_MEM_DEFINED(wc.addr_ptr, bytes(bo)));
678813957e3Ssnj
679813957e3Ssnj	DBG(("%s: caching CPU(wc) vma for %d\n", __FUNCTION__, bo->handle));
680813957e3Ssnj	return bo->map__wc = (void *)(uintptr_t)wc.addr_ptr;
681813957e3Ssnj}
682813957e3Ssnj
683813957e3Ssnjstatic void *__kgem_bo_map__cpu(struct kgem *kgem, struct kgem_bo *bo)
684813957e3Ssnj{
68563ef14f0Smrg	struct local_i915_gem_mmap arg;
686813957e3Ssnj	int err;
687813957e3Ssnj
68863ef14f0Smrg	VG_CLEAR(arg);
68963ef14f0Smrg	arg.offset = 0;
69063ef14f0Smrg
691813957e3Ssnjretry:
69263ef14f0Smrg	arg.handle = bo->handle;
69363ef14f0Smrg	arg.size = bytes(bo);
69463ef14f0Smrg	if ((err = do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_MMAP, &arg))) {
69563ef14f0Smrg		DBG(("%s: failed %d, throttling/cleaning caches\n",
69663ef14f0Smrg		     __FUNCTION__, err));
69763ef14f0Smrg		assert(err != -EINVAL || bo->prime);
698813957e3Ssnj
699813957e3Ssnj		if (__kgem_throttle_retire(kgem, 0))
700813957e3Ssnj			goto retry;
701813957e3Ssnj
702813957e3Ssnj		if (kgem_cleanup_cache(kgem))
703813957e3Ssnj			goto retry;
704813957e3Ssnj
70563ef14f0Smrg		ERR(("%s: failed to mmap handle=%d (prime? %d), %d bytes, into CPU domain: %d\n",
70663ef14f0Smrg		     __FUNCTION__, bo->handle, bo->prime, bytes(bo), -err));
70763ef14f0Smrg		bo->purged = 1;
708813957e3Ssnj		return NULL;
709813957e3Ssnj	}
710813957e3Ssnj
71163ef14f0Smrg	VG(VALGRIND_MAKE_MEM_DEFINED(arg.addr_ptr, bytes(bo)));
712813957e3Ssnj
713813957e3Ssnj	DBG(("%s: caching CPU vma for %d\n", __FUNCTION__, bo->handle));
71463ef14f0Smrg	return bo->map__cpu = (void *)(uintptr_t)arg.addr_ptr;
71503b705cfSriastradh}
71603b705cfSriastradh
7179a906b70Schristosstatic int gem_write(int fd, uint32_t handle,
7189a906b70Schristos		     int offset, int length,
7199a906b70Schristos		     const void *src)
72003b705cfSriastradh{
72103b705cfSriastradh	struct drm_i915_gem_pwrite pwrite;
72203b705cfSriastradh
72303b705cfSriastradh	DBG(("%s(handle=%d, offset=%d, len=%d)\n", __FUNCTION__,
72403b705cfSriastradh	     handle, offset, length));
72503b705cfSriastradh
72603b705cfSriastradh	VG_CLEAR(pwrite);
72703b705cfSriastradh	pwrite.handle = handle;
72803b705cfSriastradh	pwrite.offset = offset;
72903b705cfSriastradh	pwrite.size = length;
73003b705cfSriastradh	pwrite.data_ptr = (uintptr_t)src;
7319a906b70Schristos	return do_ioctl(fd, DRM_IOCTL_I915_GEM_PWRITE, &pwrite);
73203b705cfSriastradh}
73303b705cfSriastradh
7349a906b70Schristosstatic int gem_write__cachealigned(int fd, uint32_t handle,
7359a906b70Schristos				   int offset, int length,
7369a906b70Schristos				   const void *src)
73703b705cfSriastradh{
73803b705cfSriastradh	struct drm_i915_gem_pwrite pwrite;
73903b705cfSriastradh
74003b705cfSriastradh	DBG(("%s(handle=%d, offset=%d, len=%d)\n", __FUNCTION__,
74103b705cfSriastradh	     handle, offset, length));
74203b705cfSriastradh
74303b705cfSriastradh	VG_CLEAR(pwrite);
74403b705cfSriastradh	pwrite.handle = handle;
74503b705cfSriastradh	/* align the transfer to cachelines; fortuitously this is safe! */
74603b705cfSriastradh	if ((offset | length) & 63) {
74703b705cfSriastradh		pwrite.offset = offset & ~63;
74803b705cfSriastradh		pwrite.size = ALIGN(offset+length, 64) - pwrite.offset;
74903b705cfSriastradh		pwrite.data_ptr = (uintptr_t)src + pwrite.offset - offset;
75003b705cfSriastradh	} else {
75103b705cfSriastradh		pwrite.offset = offset;
75203b705cfSriastradh		pwrite.size = length;
75303b705cfSriastradh		pwrite.data_ptr = (uintptr_t)src;
75403b705cfSriastradh	}
7559a906b70Schristos	return do_ioctl(fd, DRM_IOCTL_I915_GEM_PWRITE, &pwrite);
75603b705cfSriastradh}
75703b705cfSriastradh
75803b705cfSriastradhstatic int gem_read(int fd, uint32_t handle, const void *dst,
75903b705cfSriastradh		    int offset, int length)
76003b705cfSriastradh{
76103b705cfSriastradh	struct drm_i915_gem_pread pread;
76203b705cfSriastradh	int ret;
76303b705cfSriastradh
76403b705cfSriastradh	DBG(("%s(handle=%d, len=%d)\n", __FUNCTION__,
76503b705cfSriastradh	     handle, length));
76603b705cfSriastradh
76703b705cfSriastradh	VG_CLEAR(pread);
76803b705cfSriastradh	pread.handle = handle;
76903b705cfSriastradh	pread.offset = offset;
77003b705cfSriastradh	pread.size = length;
77103b705cfSriastradh	pread.data_ptr = (uintptr_t)dst;
7729a906b70Schristos	ret = do_ioctl(fd, DRM_IOCTL_I915_GEM_PREAD, &pread);
77303b705cfSriastradh	if (ret) {
7749a906b70Schristos		DBG(("%s: failed, errno=%d\n", __FUNCTION__, -ret));
77503b705cfSriastradh		return ret;
77603b705cfSriastradh	}
77703b705cfSriastradh
77803b705cfSriastradh	VG(VALGRIND_MAKE_MEM_DEFINED(dst, length));
77903b705cfSriastradh	return 0;
78003b705cfSriastradh}
78103b705cfSriastradh
78203b705cfSriastradhbool __kgem_busy(struct kgem *kgem, int handle)
78303b705cfSriastradh{
78403b705cfSriastradh	struct drm_i915_gem_busy busy;
78503b705cfSriastradh
78603b705cfSriastradh	VG_CLEAR(busy);
78703b705cfSriastradh	busy.handle = handle;
78803b705cfSriastradh	busy.busy = !kgem->wedged;
7899a906b70Schristos	(void)do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_BUSY, &busy);
79003b705cfSriastradh	DBG(("%s: handle=%d, busy=%d, wedged=%d\n",
79103b705cfSriastradh	     __FUNCTION__, handle, busy.busy, kgem->wedged));
79203b705cfSriastradh
79303b705cfSriastradh	return busy.busy;
79403b705cfSriastradh}
79503b705cfSriastradh
79603b705cfSriastradhstatic void kgem_bo_retire(struct kgem *kgem, struct kgem_bo *bo)
79703b705cfSriastradh{
79803b705cfSriastradh	DBG(("%s: retiring bo handle=%d (needed flush? %d), rq? %d [busy?=%d]\n",
79903b705cfSriastradh	     __FUNCTION__, bo->handle, bo->needs_flush, bo->rq != NULL,
80003b705cfSriastradh	     __kgem_busy(kgem, bo->handle)));
80103b705cfSriastradh	assert(bo->exec == NULL);
80203b705cfSriastradh	assert(list_is_empty(&bo->vma));
80303b705cfSriastradh
80463ef14f0Smrg	if (bo->rq)
80563ef14f0Smrg		__kgem_retire_requests_upto(kgem, bo);
80663ef14f0Smrg	ASSERT_IDLE(kgem, bo->handle);
80763ef14f0Smrg	assert_bo_retired(bo);
8089a906b70Schristos}
8099a906b70Schristos
8109a906b70Schristosstatic void kgem_bo_maybe_retire(struct kgem *kgem, struct kgem_bo *bo)
8119a906b70Schristos{
8129a906b70Schristos	DBG(("%s: retiring bo handle=%d (needed flush? %d), rq? %d [busy?=%d]\n",
8139a906b70Schristos	     __FUNCTION__, bo->handle, bo->needs_flush, bo->rq != NULL,
8149a906b70Schristos	     __kgem_busy(kgem, bo->handle)));
8159a906b70Schristos	assert(bo->exec == NULL);
8169a906b70Schristos	assert(list_is_empty(&bo->vma));
8179a906b70Schristos
81803b705cfSriastradh	if (bo->rq) {
81963ef14f0Smrg		if (!__kgem_busy(kgem, bo->handle))
82063ef14f0Smrg			__kgem_retire_requests_upto(kgem, bo);
82103b705cfSriastradh	} else {
82203b705cfSriastradh		assert(!bo->needs_flush);
82303b705cfSriastradh		ASSERT_IDLE(kgem, bo->handle);
82403b705cfSriastradh	}
82503b705cfSriastradh}
82603b705cfSriastradh
82703b705cfSriastradhbool kgem_bo_write(struct kgem *kgem, struct kgem_bo *bo,
82803b705cfSriastradh		   const void *data, int length)
82903b705cfSriastradh{
830813957e3Ssnj	void *ptr;
8319a906b70Schristos	int err;
8329a906b70Schristos
83303b705cfSriastradh	assert(bo->refcnt);
83403b705cfSriastradh	assert(bo->proxy == NULL);
83503b705cfSriastradh	ASSERT_IDLE(kgem, bo->handle);
83603b705cfSriastradh
83703b705cfSriastradh	assert(length <= bytes(bo));
8389a906b70Schristosretry:
839813957e3Ssnj	ptr = NULL;
840813957e3Ssnj	if (bo->domain == DOMAIN_CPU || (kgem->has_llc && !bo->scanout)) {
841813957e3Ssnj		ptr = bo->map__cpu;
842813957e3Ssnj		if (ptr == NULL)
843813957e3Ssnj			ptr = __kgem_bo_map__cpu(kgem, bo);
844813957e3Ssnj	} else if (kgem->has_wc_mmap) {
845813957e3Ssnj		ptr = bo->map__wc;
846813957e3Ssnj		if (ptr == NULL)
847813957e3Ssnj			ptr = __kgem_bo_map__wc(kgem, bo);
848813957e3Ssnj	}
849813957e3Ssnj	if (ptr) {
850813957e3Ssnj		/* XXX unsynchronized? */
851813957e3Ssnj		memcpy(ptr, data, length);
852813957e3Ssnj		return true;
853813957e3Ssnj	}
854813957e3Ssnj
8559a906b70Schristos	if ((err = gem_write(kgem->fd, bo->handle, 0, length, data))) {
85663ef14f0Smrg		DBG(("%s: failed %d, throttling/cleaning caches\n",
85763ef14f0Smrg		     __FUNCTION__, err));
8589a906b70Schristos		assert(err != EINVAL);
8599a906b70Schristos
8609a906b70Schristos		(void)__kgem_throttle_retire(kgem, 0);
8619a906b70Schristos		if (kgem_expire_cache(kgem))
8629a906b70Schristos			goto retry;
8639a906b70Schristos
8649a906b70Schristos		if (kgem_cleanup_cache(kgem))
8659a906b70Schristos			goto retry;
8669a906b70Schristos
8679a906b70Schristos		ERR(("%s: failed to write %d bytes into BO handle=%d: %d\n",
8689a906b70Schristos		     __FUNCTION__, length, bo->handle, -err));
86903b705cfSriastradh		return false;
8709a906b70Schristos	}
87103b705cfSriastradh
87203b705cfSriastradh	DBG(("%s: flush=%d, domain=%d\n", __FUNCTION__, bo->flush, bo->domain));
8739a906b70Schristos	if (bo->exec == NULL)
8749a906b70Schristos		kgem_bo_maybe_retire(kgem, bo);
8759a906b70Schristos	bo->domain = DOMAIN_NONE;
87603b705cfSriastradh	bo->gtt_dirty = true;
87703b705cfSriastradh	return true;
87803b705cfSriastradh}
87903b705cfSriastradh
88003b705cfSriastradhstatic uint32_t gem_create(int fd, int num_pages)
88103b705cfSriastradh{
88203b705cfSriastradh	struct drm_i915_gem_create create;
88303b705cfSriastradh
88403b705cfSriastradh	VG_CLEAR(create);
88503b705cfSriastradh	create.handle = 0;
88603b705cfSriastradh	create.size = PAGE_SIZE * num_pages;
8879a906b70Schristos	(void)do_ioctl(fd, DRM_IOCTL_I915_GEM_CREATE, &create);
88803b705cfSriastradh
88903b705cfSriastradh	return create.handle;
89003b705cfSriastradh}
89103b705cfSriastradh
89263ef14f0Smrgstatic void
89303b705cfSriastradhkgem_bo_set_purgeable(struct kgem *kgem, struct kgem_bo *bo)
89403b705cfSriastradh{
89563ef14f0Smrg#if !DBG_NO_MADV
89603b705cfSriastradh	struct drm_i915_gem_madvise madv;
89703b705cfSriastradh
89803b705cfSriastradh	assert(bo->exec == NULL);
89903b705cfSriastradh
90003b705cfSriastradh	VG_CLEAR(madv);
90103b705cfSriastradh	madv.handle = bo->handle;
90203b705cfSriastradh	madv.madv = I915_MADV_DONTNEED;
9039a906b70Schristos	if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_MADVISE, &madv) == 0) {
90463ef14f0Smrg		bo->purged = true;
90563ef14f0Smrg		kgem->need_purge |= !madv.retained && bo->domain != DOMAIN_CPU;
90603b705cfSriastradh	}
90703b705cfSriastradh#endif
90803b705cfSriastradh}
90903b705cfSriastradh
91003b705cfSriastradhstatic bool
91103b705cfSriastradhkgem_bo_is_retained(struct kgem *kgem, struct kgem_bo *bo)
91203b705cfSriastradh{
91303b705cfSriastradh#if DBG_NO_MADV
91403b705cfSriastradh	return true;
91503b705cfSriastradh#else
91603b705cfSriastradh	struct drm_i915_gem_madvise madv;
91703b705cfSriastradh
91803b705cfSriastradh	if (!bo->purged)
91903b705cfSriastradh		return true;
92003b705cfSriastradh
92103b705cfSriastradh	VG_CLEAR(madv);
92203b705cfSriastradh	madv.handle = bo->handle;
92303b705cfSriastradh	madv.madv = I915_MADV_DONTNEED;
9249a906b70Schristos	if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_MADVISE, &madv) == 0)
92503b705cfSriastradh		return madv.retained;
92603b705cfSriastradh
92703b705cfSriastradh	return false;
92803b705cfSriastradh#endif
92903b705cfSriastradh}
93003b705cfSriastradh
93103b705cfSriastradhstatic bool
93203b705cfSriastradhkgem_bo_clear_purgeable(struct kgem *kgem, struct kgem_bo *bo)
93303b705cfSriastradh{
93403b705cfSriastradh#if DBG_NO_MADV
93503b705cfSriastradh	return true;
93603b705cfSriastradh#else
93703b705cfSriastradh	struct drm_i915_gem_madvise madv;
93803b705cfSriastradh
93903b705cfSriastradh	assert(bo->purged);
94003b705cfSriastradh
94103b705cfSriastradh	VG_CLEAR(madv);
94203b705cfSriastradh	madv.handle = bo->handle;
94303b705cfSriastradh	madv.madv = I915_MADV_WILLNEED;
9449a906b70Schristos	if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_MADVISE, &madv) == 0) {
94503b705cfSriastradh		bo->purged = !madv.retained;
94663ef14f0Smrg		kgem->need_purge |= !madv.retained && bo->domain != DOMAIN_CPU;
94703b705cfSriastradh		return madv.retained;
94803b705cfSriastradh	}
94903b705cfSriastradh
95003b705cfSriastradh	return false;
95103b705cfSriastradh#endif
95203b705cfSriastradh}
95303b705cfSriastradh
95403b705cfSriastradhstatic void gem_close(int fd, uint32_t handle)
95503b705cfSriastradh{
95603b705cfSriastradh	struct drm_gem_close close;
95703b705cfSriastradh
95803b705cfSriastradh	VG_CLEAR(close);
95903b705cfSriastradh	close.handle = handle;
9609a906b70Schristos	(void)do_ioctl(fd, DRM_IOCTL_GEM_CLOSE, &close);
96103b705cfSriastradh}
96203b705cfSriastradh
96303b705cfSriastradhconstant inline static unsigned long __fls(unsigned long word)
96403b705cfSriastradh{
96503b705cfSriastradh#if defined(__GNUC__) && (defined(__i386__) || defined(__x86__) || defined(__x86_64__))
96603b705cfSriastradh	asm("bsr %1,%0"
96703b705cfSriastradh	    : "=r" (word)
96803b705cfSriastradh	    : "rm" (word));
96903b705cfSriastradh	return word;
97003b705cfSriastradh#else
97103b705cfSriastradh	unsigned int v = 0;
97203b705cfSriastradh
97303b705cfSriastradh	while (word >>= 1)
97403b705cfSriastradh		v++;
97503b705cfSriastradh
97603b705cfSriastradh	return v;
97703b705cfSriastradh#endif
97803b705cfSriastradh}
97903b705cfSriastradh
98003b705cfSriastradhconstant inline static int cache_bucket(int num_pages)
98103b705cfSriastradh{
98203b705cfSriastradh	return __fls(num_pages);
98303b705cfSriastradh}
98403b705cfSriastradh
98503b705cfSriastradhstatic struct kgem_bo *__kgem_bo_init(struct kgem_bo *bo,
98603b705cfSriastradh				      int handle, int num_pages)
98703b705cfSriastradh{
9889a906b70Schristos	DBG(("%s(handle=%d, num_pages=%d)\n", __FUNCTION__, handle, num_pages));
9899a906b70Schristos
99003b705cfSriastradh	assert(num_pages);
99103b705cfSriastradh	memset(bo, 0, sizeof(*bo));
99203b705cfSriastradh
99303b705cfSriastradh	bo->refcnt = 1;
99403b705cfSriastradh	bo->handle = handle;
99503b705cfSriastradh	bo->target_handle = -1;
99603b705cfSriastradh	num_pages(bo) = num_pages;
99703b705cfSriastradh	bucket(bo) = cache_bucket(num_pages);
99803b705cfSriastradh	bo->reusable = true;
99903b705cfSriastradh	bo->domain = DOMAIN_CPU;
100003b705cfSriastradh	list_init(&bo->request);
100103b705cfSriastradh	list_init(&bo->list);
100203b705cfSriastradh	list_init(&bo->vma);
100303b705cfSriastradh
100403b705cfSriastradh	return bo;
100503b705cfSriastradh}
100603b705cfSriastradh
100703b705cfSriastradhstatic struct kgem_bo *__kgem_bo_alloc(int handle, int num_pages)
100803b705cfSriastradh{
100903b705cfSriastradh	struct kgem_bo *bo;
101003b705cfSriastradh
101103b705cfSriastradh	if (__kgem_freed_bo) {
101203b705cfSriastradh		bo = __kgem_freed_bo;
101303b705cfSriastradh		__kgem_freed_bo = *(struct kgem_bo **)bo;
101403b705cfSriastradh	} else {
101503b705cfSriastradh		bo = malloc(sizeof(*bo));
101603b705cfSriastradh		if (bo == NULL)
101703b705cfSriastradh			return NULL;
101803b705cfSriastradh	}
101903b705cfSriastradh
102003b705cfSriastradh	return __kgem_bo_init(bo, handle, num_pages);
102103b705cfSriastradh}
102203b705cfSriastradh
102303b705cfSriastradhstatic struct kgem_request *__kgem_request_alloc(struct kgem *kgem)
102403b705cfSriastradh{
102503b705cfSriastradh	struct kgem_request *rq;
102603b705cfSriastradh
102763ef14f0Smrg	if (unlikely(kgem->wedged)) {
102863ef14f0Smrg		rq = &kgem->static_request;
102903b705cfSriastradh	} else {
103063ef14f0Smrg		rq = __kgem_freed_request;
103163ef14f0Smrg		if (rq) {
103263ef14f0Smrg			__kgem_freed_request = *(struct kgem_request **)rq;
103363ef14f0Smrg		} else {
103463ef14f0Smrg			rq = malloc(sizeof(*rq));
103563ef14f0Smrg			if (rq == NULL)
103663ef14f0Smrg				rq = &kgem->static_request;
103763ef14f0Smrg		}
103803b705cfSriastradh	}
103903b705cfSriastradh
104003b705cfSriastradh	list_init(&rq->buffers);
104103b705cfSriastradh	rq->bo = NULL;
104203b705cfSriastradh	rq->ring = 0;
104303b705cfSriastradh
104403b705cfSriastradh	return rq;
104503b705cfSriastradh}
104603b705cfSriastradh
104703b705cfSriastradhstatic void __kgem_request_free(struct kgem_request *rq)
104803b705cfSriastradh{
104903b705cfSriastradh	_list_del(&rq->list);
10509a906b70Schristos	if (DBG_NO_MALLOC_CACHE) {
10519a906b70Schristos		free(rq);
10529a906b70Schristos	} else {
10539a906b70Schristos		*(struct kgem_request **)rq = __kgem_freed_request;
10549a906b70Schristos		__kgem_freed_request = rq;
10559a906b70Schristos	}
105603b705cfSriastradh}
105703b705cfSriastradh
105803b705cfSriastradhstatic struct list *inactive(struct kgem *kgem, int num_pages)
105903b705cfSriastradh{
106003b705cfSriastradh	assert(num_pages < MAX_CACHE_SIZE / PAGE_SIZE);
106103b705cfSriastradh	assert(cache_bucket(num_pages) < NUM_CACHE_BUCKETS);
106203b705cfSriastradh	return &kgem->inactive[cache_bucket(num_pages)];
106303b705cfSriastradh}
106403b705cfSriastradh
106503b705cfSriastradhstatic struct list *active(struct kgem *kgem, int num_pages, int tiling)
106603b705cfSriastradh{
106703b705cfSriastradh	assert(num_pages < MAX_CACHE_SIZE / PAGE_SIZE);
106803b705cfSriastradh	assert(cache_bucket(num_pages) < NUM_CACHE_BUCKETS);
106903b705cfSriastradh	return &kgem->active[cache_bucket(num_pages)][tiling];
107003b705cfSriastradh}
107103b705cfSriastradh
107203b705cfSriastradhstatic size_t
107303b705cfSriastradhagp_aperture_size(struct pci_device *dev, unsigned gen)
107403b705cfSriastradh{
107503b705cfSriastradh	/* XXX assume that only future chipsets are unknown and follow
107603b705cfSriastradh	 * the post gen2 PCI layout.
107703b705cfSriastradh	 */
107803b705cfSriastradh	return dev->regions[gen < 030 ? 0 : 2].size;
107903b705cfSriastradh}
108003b705cfSriastradh
/*
 * Return the amount of physical memory in bytes, or 0 when it cannot be
 * determined.
 *
 * sysinfo() is preferred where the build detected it; otherwise (or if it
 * fails) the answer is derived from sysconf().  A failing sysconf() call
 * returns -1, which must not be fed into the multiplication, so both
 * values are validated first.
 */
static size_t
total_ram_size(void)
{
#ifdef HAVE_STRUCT_SYSINFO_TOTALRAM
	struct sysinfo info;
	if (sysinfo(&info) == 0)
		return (size_t)info.totalram * info.mem_unit;
#endif

#ifdef _SC_PHYS_PAGES
	{
		long pages = sysconf(_SC_PHYS_PAGES);
		long page_size = sysconf(_SC_PAGE_SIZE);

		if (pages > 0 && page_size > 0)
			return (size_t)pages * (size_t)page_size;
	}
#endif

	return 0;
}
109603b705cfSriastradh
109703b705cfSriastradhstatic unsigned
109803b705cfSriastradhcpu_cache_size__cpuid4(void)
109903b705cfSriastradh{
11009a906b70Schristos	/* Deterministic Cache Parameters (Function 04h)":
110103b705cfSriastradh	 *    When EAX is initialized to a value of 4, the CPUID instruction
110203b705cfSriastradh	 *    returns deterministic cache information in the EAX, EBX, ECX
110303b705cfSriastradh	 *    and EDX registers.  This function requires ECX be initialized
110403b705cfSriastradh	 *    with an index which indicates which cache to return information
110503b705cfSriastradh	 *    about. The OS is expected to call this function (CPUID.4) with
110603b705cfSriastradh	 *    ECX = 0, 1, 2, until EAX[4:0] == 0, indicating no more caches.
110703b705cfSriastradh	 *    The order in which the caches are returned is not specified
110803b705cfSriastradh	 *    and may change at Intel's discretion.
110903b705cfSriastradh	 *
111003b705cfSriastradh	 * Calculating the Cache Size in bytes:
111103b705cfSriastradh	 *          = (Ways +1) * (Partitions +1) * (Line Size +1) * (Sets +1)
111203b705cfSriastradh	 */
111303b705cfSriastradh
111403b705cfSriastradh	 unsigned int eax, ebx, ecx, edx;
111503b705cfSriastradh	 unsigned int llc_size = 0;
11169a906b70Schristos	 int cnt;
111703b705cfSriastradh
111803b705cfSriastradh	 if (__get_cpuid_max(BASIC_CPUID, NULL) < 4)
111903b705cfSriastradh		 return 0;
112003b705cfSriastradh
11219a906b70Schristos	 cnt = 0;
112203b705cfSriastradh	 do {
112303b705cfSriastradh		 unsigned associativity, line_partitions, line_size, sets;
112403b705cfSriastradh
112503b705cfSriastradh		 __cpuid_count(4, cnt++, eax, ebx, ecx, edx);
112603b705cfSriastradh
112703b705cfSriastradh		 if ((eax & 0x1f) == 0)
112803b705cfSriastradh			 break;
112903b705cfSriastradh
113003b705cfSriastradh		 associativity = ((ebx >> 22) & 0x3ff) + 1;
113103b705cfSriastradh		 line_partitions = ((ebx >> 12) & 0x3ff) + 1;
113203b705cfSriastradh		 line_size = (ebx & 0xfff) + 1;
113303b705cfSriastradh		 sets = ecx + 1;
113403b705cfSriastradh
113503b705cfSriastradh		 llc_size = associativity * line_partitions * line_size * sets;
113603b705cfSriastradh	 } while (1);
113703b705cfSriastradh
113803b705cfSriastradh	 return llc_size;
113903b705cfSriastradh}
114003b705cfSriastradh
/*
 * Return the CPU cache size in bytes.
 *
 * CPUID leaf 4 is tried first.  Failing that, the first "cache size" line
 * of /proc/cpuinfo is parsed; values that are not positive or exceed
 * 1<<20 KB are ignored.  If neither source yields a size, 64 KiB is
 * assumed.
 */
static unsigned
cpu_cache_size(void)
{
	unsigned size;
	FILE *file;

	size = cpu_cache_size__cpuid4();
	if (size)
		return size;

	file = fopen("/proc/cpuinfo", "r");
	if (file) {
		size_t len = 0;
		char *line = NULL;
		while (getline(&line, &len, file) != -1) {
			int kb;
			if (sscanf(line, "cache size : %d KB", &kb) == 1) {
				/* Paranoid check against nonsensical
				 * (zero/negative) and gargantuan caches;
				 * a negative value would wrap to a huge
				 * unsigned size.
				 */
				if (kb > 0 && kb <= 1<<20)
					size = kb * 1024;
				break;
			}
		}
		free(line);
		fclose(file);
	}

	if (size == 0)
		size = 64 * 1024;

	return size;
}
117303b705cfSriastradh
117403b705cfSriastradhstatic int gem_param(struct kgem *kgem, int name)
117503b705cfSriastradh{
117603b705cfSriastradh	drm_i915_getparam_t gp;
117703b705cfSriastradh	int v = -1; /* No param uses the sign bit, reserve it for errors */
117803b705cfSriastradh
117903b705cfSriastradh	VG_CLEAR(gp);
118003b705cfSriastradh	gp.param = name;
118103b705cfSriastradh	gp.value = &v;
11829a906b70Schristos	if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GETPARAM, &gp))
118303b705cfSriastradh		return -1;
118403b705cfSriastradh
118503b705cfSriastradh	VG(VALGRIND_MAKE_MEM_DEFINED(&v, sizeof(v)));
118603b705cfSriastradh	return v;
118703b705cfSriastradh}
118803b705cfSriastradh
118903b705cfSriastradhstatic bool test_has_execbuffer2(struct kgem *kgem)
119003b705cfSriastradh{
119103b705cfSriastradh	struct drm_i915_gem_execbuffer2 execbuf;
119203b705cfSriastradh
119303b705cfSriastradh	memset(&execbuf, 0, sizeof(execbuf));
119403b705cfSriastradh	execbuf.buffer_count = 1;
119503b705cfSriastradh
11969a906b70Schristos	return do_ioctl(kgem->fd,
119703b705cfSriastradh			 DRM_IOCTL_I915_GEM_EXECBUFFER2,
11989a906b70Schristos			 &execbuf) == -EFAULT;
119903b705cfSriastradh}
120003b705cfSriastradh
120103b705cfSriastradhstatic bool test_has_no_reloc(struct kgem *kgem)
120203b705cfSriastradh{
120303b705cfSriastradh	if (DBG_NO_FAST_RELOC)
120403b705cfSriastradh		return false;
120503b705cfSriastradh
120603b705cfSriastradh	return gem_param(kgem, LOCAL_I915_PARAM_HAS_NO_RELOC) > 0;
120703b705cfSriastradh}
120803b705cfSriastradh
120903b705cfSriastradhstatic bool test_has_handle_lut(struct kgem *kgem)
121003b705cfSriastradh{
121103b705cfSriastradh	if (DBG_NO_HANDLE_LUT)
121203b705cfSriastradh		return false;
121303b705cfSriastradh
121403b705cfSriastradh	return gem_param(kgem, LOCAL_I915_PARAM_HAS_HANDLE_LUT) > 0;
121503b705cfSriastradh}
121603b705cfSriastradh
121703b705cfSriastradhstatic bool test_has_wt(struct kgem *kgem)
121803b705cfSriastradh{
121903b705cfSriastradh	if (DBG_NO_WT)
122003b705cfSriastradh		return false;
122103b705cfSriastradh
122203b705cfSriastradh	return gem_param(kgem, LOCAL_I915_PARAM_HAS_WT) > 0;
122303b705cfSriastradh}
122403b705cfSriastradh
122503b705cfSriastradhstatic bool test_has_semaphores_enabled(struct kgem *kgem)
122603b705cfSriastradh{
122703b705cfSriastradh	FILE *file;
122803b705cfSriastradh	bool detected = false;
122903b705cfSriastradh	int ret;
123003b705cfSriastradh
123103b705cfSriastradh	if (DBG_NO_SEMAPHORES)
123203b705cfSriastradh		return false;
123303b705cfSriastradh
123403b705cfSriastradh	ret = gem_param(kgem, LOCAL_I915_PARAM_HAS_SEMAPHORES);
123503b705cfSriastradh	if (ret != -1)
123603b705cfSriastradh		return ret > 0;
123703b705cfSriastradh
123803b705cfSriastradh	file = fopen("/sys/module/i915/parameters/semaphores", "r");
123903b705cfSriastradh	if (file) {
124003b705cfSriastradh		int value;
124103b705cfSriastradh		if (fscanf(file, "%d", &value) == 1)
124203b705cfSriastradh			detected = value != 0;
124303b705cfSriastradh		fclose(file);
124403b705cfSriastradh	}
124503b705cfSriastradh
124603b705cfSriastradh	return detected;
124703b705cfSriastradh}
124803b705cfSriastradh
124903b705cfSriastradhstatic bool is_hw_supported(struct kgem *kgem,
125003b705cfSriastradh			    struct pci_device *dev)
125103b705cfSriastradh{
125203b705cfSriastradh	if (DBG_NO_HW)
125303b705cfSriastradh		return false;
125403b705cfSriastradh
125503b705cfSriastradh	if (!test_has_execbuffer2(kgem))
125603b705cfSriastradh		return false;
125703b705cfSriastradh
125803b705cfSriastradh	if (kgem->gen == (unsigned)-1) /* unknown chipset, assume future gen */
125903b705cfSriastradh		return kgem->has_blt;
126003b705cfSriastradh
126103b705cfSriastradh	/* Although pre-855gm the GMCH is fubar, it works mostly. So
126203b705cfSriastradh	 * let the user decide through "NoAccel" whether or not to risk
126303b705cfSriastradh	 * hw acceleration.
126403b705cfSriastradh	 */
126503b705cfSriastradh
12669a906b70Schristos	if (kgem->gen == 060 && dev && dev->revision < 8) {
126703b705cfSriastradh		/* pre-production SNB with dysfunctional BLT */
126803b705cfSriastradh		return false;
126903b705cfSriastradh	}
127003b705cfSriastradh
127103b705cfSriastradh	if (kgem->gen >= 060) /* Only if the kernel supports the BLT ring */
127203b705cfSriastradh		return kgem->has_blt;
127303b705cfSriastradh
127403b705cfSriastradh	return true;
127503b705cfSriastradh}
127603b705cfSriastradh
127703b705cfSriastradhstatic bool test_has_relaxed_fencing(struct kgem *kgem)
127803b705cfSriastradh{
127903b705cfSriastradh	if (kgem->gen < 040) {
128003b705cfSriastradh		if (DBG_NO_RELAXED_FENCING)
128103b705cfSriastradh			return false;
128203b705cfSriastradh
128303b705cfSriastradh		return gem_param(kgem, LOCAL_I915_PARAM_HAS_RELAXED_FENCING) > 0;
128403b705cfSriastradh	} else
128503b705cfSriastradh		return true;
128603b705cfSriastradh}
128703b705cfSriastradh
128863ef14f0Smrgstatic bool test_has_coherent_mmap_gtt(struct kgem *kgem)
128963ef14f0Smrg{
129063ef14f0Smrg	if (DBG_NO_COHERENT_MMAP_GTT)
129163ef14f0Smrg		return false;
129263ef14f0Smrg
129363ef14f0Smrg	return gem_param(kgem, LOCAL_I915_PARAM_MMAP_GTT_COHERENT) > 0;
129463ef14f0Smrg}
129563ef14f0Smrg
129603b705cfSriastradhstatic bool test_has_llc(struct kgem *kgem)
129703b705cfSriastradh{
129803b705cfSriastradh	int has_llc = -1;
129903b705cfSriastradh
130003b705cfSriastradh	if (DBG_NO_LLC)
130103b705cfSriastradh		return false;
130203b705cfSriastradh
1303813957e3Ssnj	has_llc = gem_param(kgem, LOCAL_I915_PARAM_HAS_LLC);
130403b705cfSriastradh	if (has_llc == -1) {
130503b705cfSriastradh		DBG(("%s: no kernel/drm support for HAS_LLC, assuming support for LLC based on GPU generation\n", __FUNCTION__));
130603b705cfSriastradh		has_llc = kgem->gen >= 060;
130703b705cfSriastradh	}
130803b705cfSriastradh
130903b705cfSriastradh	return has_llc;
131003b705cfSriastradh}
131103b705cfSriastradh
1312813957e3Ssnjstatic bool test_has_wc_mmap(struct kgem *kgem)
1313813957e3Ssnj{
1314813957e3Ssnj	struct local_i915_gem_mmap2 wc;
1315813957e3Ssnj	bool ret;
1316813957e3Ssnj
1317813957e3Ssnj	if (DBG_NO_WC_MMAP)
1318813957e3Ssnj		return false;
1319813957e3Ssnj
132063ef14f0Smrg	/* XXX See https://bugs.freedesktop.org/show_bug.cgi?id=90841 */
132163ef14f0Smrg	if (kgem->gen < 033)
132263ef14f0Smrg		return false;
132363ef14f0Smrg
1324813957e3Ssnj	if (gem_param(kgem, LOCAL_I915_PARAM_MMAP_VERSION) < 1)
1325813957e3Ssnj		return false;
1326813957e3Ssnj
1327813957e3Ssnj	VG_CLEAR(wc);
1328813957e3Ssnj	wc.handle = gem_create(kgem->fd, 1);
1329813957e3Ssnj	wc.offset = 0;
1330813957e3Ssnj	wc.size = 4096;
1331813957e3Ssnj	wc.flags = I915_MMAP_WC;
1332813957e3Ssnj	ret = do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_MMAP_v2, &wc) == 0;
1333813957e3Ssnj	gem_close(kgem->fd, wc.handle);
1334813957e3Ssnj
1335813957e3Ssnj	return ret;
1336813957e3Ssnj}
1337813957e3Ssnj
133803b705cfSriastradhstatic bool test_has_caching(struct kgem *kgem)
133903b705cfSriastradh{
134003b705cfSriastradh	uint32_t handle;
134103b705cfSriastradh	bool ret;
134203b705cfSriastradh
134303b705cfSriastradh	if (DBG_NO_CACHE_LEVEL)
134403b705cfSriastradh		return false;
134503b705cfSriastradh
134603b705cfSriastradh	/* Incoherent blt and sampler hangs the GPU */
134703b705cfSriastradh	if (kgem->gen == 040)
134803b705cfSriastradh		return false;
134903b705cfSriastradh
135003b705cfSriastradh	handle = gem_create(kgem->fd, 1);
135103b705cfSriastradh	if (handle == 0)
135203b705cfSriastradh		return false;
135303b705cfSriastradh
135403b705cfSriastradh	ret = gem_set_caching(kgem->fd, handle, UNCACHED);
135503b705cfSriastradh	gem_close(kgem->fd, handle);
135603b705cfSriastradh	return ret;
135703b705cfSriastradh}
135803b705cfSriastradh
135903b705cfSriastradhstatic bool test_has_userptr(struct kgem *kgem)
136003b705cfSriastradh{
136163ef14f0Smrg	struct local_i915_gem_userptr arg;
136203b705cfSriastradh	void *ptr;
136303b705cfSriastradh
136403b705cfSriastradh	if (DBG_NO_USERPTR)
136503b705cfSriastradh		return false;
136603b705cfSriastradh
136703b705cfSriastradh	/* Incoherent blt and sampler hangs the GPU */
136803b705cfSriastradh	if (kgem->gen == 040)
136903b705cfSriastradh		return false;
137003b705cfSriastradh
137103b705cfSriastradh	if (posix_memalign(&ptr, PAGE_SIZE, PAGE_SIZE))
137203b705cfSriastradh		return false;
137303b705cfSriastradh
137463ef14f0Smrg	VG_CLEAR(arg);
137563ef14f0Smrg	arg.user_ptr = (uintptr_t)ptr;
137663ef14f0Smrg	arg.user_size = PAGE_SIZE;
137763ef14f0Smrg	arg.flags = I915_USERPTR_UNSYNCHRONIZED;
137803b705cfSriastradh
137963ef14f0Smrg	if (DBG_NO_UNSYNCHRONIZED_USERPTR ||
138063ef14f0Smrg	    do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_USERPTR, &arg)) {
138163ef14f0Smrg		arg.flags &= ~I915_USERPTR_UNSYNCHRONIZED;
138263ef14f0Smrg		if (do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_USERPTR, &arg))
138363ef14f0Smrg			arg.handle = 0;
138463ef14f0Smrg		/* Leak the userptr bo to keep the mmu_notifier alive */
138563ef14f0Smrg	} else {
138663ef14f0Smrg		gem_close(kgem->fd, arg.handle);
138763ef14f0Smrg		free(ptr);
138863ef14f0Smrg	}
138963ef14f0Smrg
139063ef14f0Smrg	return arg.handle != 0;
139103b705cfSriastradh}
139203b705cfSriastradh
/*
 * Probe for the CREATE2 ioctl by creating (and immediately closing) a
 * one-page object with DISPLAY caching.
 *
 * Returns true when the request ends up with a non-zero handle.  Always
 * false unless the build defines USE_CREATE2, and with DBG_NO_CREATE2.
 */
static bool test_has_create2(struct kgem *kgem)
{
#if !defined(USE_CREATE2)
	return false;
#else
	struct local_i915_gem_create2 args;

	if (DBG_NO_CREATE2)
		return false;

	/* zeroed up front, so the handle stays 0 unless the kernel sets it */
	memset(&args, 0, sizeof(args));
	args.caching = DISPLAY;
	args.size = PAGE_SIZE;

	if (do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_CREATE2, &args) == 0)
		gem_close(kgem->fd, args.handle);

	return args.handle != 0;
#endif
}
141203b705cfSriastradh
141363ef14f0Smrgstatic bool test_can_blt_y(struct kgem *kgem)
141403b705cfSriastradh{
141563ef14f0Smrg	struct drm_i915_gem_exec_object2 object;
141663ef14f0Smrg	uint32_t batch[] = {
141763ef14f0Smrg#define MI_LOAD_REGISTER_IMM (0x22<<23 | (3-2))
141863ef14f0Smrg#define BCS_SWCTRL 0x22200
141963ef14f0Smrg#define BCS_SRC_Y (1 << 0)
142063ef14f0Smrg#define BCS_DST_Y (1 << 1)
142163ef14f0Smrg		MI_LOAD_REGISTER_IMM,
142263ef14f0Smrg		BCS_SWCTRL,
142363ef14f0Smrg		(BCS_SRC_Y | BCS_DST_Y) << 16 | (BCS_SRC_Y | BCS_DST_Y),
142463ef14f0Smrg
142563ef14f0Smrg		MI_LOAD_REGISTER_IMM,
142663ef14f0Smrg		BCS_SWCTRL,
142763ef14f0Smrg		(BCS_SRC_Y | BCS_DST_Y) << 16,
142863ef14f0Smrg
142963ef14f0Smrg		MI_BATCH_BUFFER_END,
143063ef14f0Smrg		0,
143163ef14f0Smrg	};
143263ef14f0Smrg	int ret;
143363ef14f0Smrg
143463ef14f0Smrg	if (DBG_NO_BLT_Y)
143503b705cfSriastradh		return false;
143603b705cfSriastradh
143763ef14f0Smrg	if (kgem->gen < 060)
143863ef14f0Smrg		return false;
143963ef14f0Smrg
144063ef14f0Smrg	memset(&object, 0, sizeof(object));
144163ef14f0Smrg	object.handle = gem_create(kgem->fd, 1);
144263ef14f0Smrg
144363ef14f0Smrg	ret = gem_write(kgem->fd, object.handle, 0, sizeof(batch), batch);
144463ef14f0Smrg	if (ret == 0) {
144563ef14f0Smrg		struct drm_i915_gem_execbuffer2 execbuf;
144663ef14f0Smrg
144763ef14f0Smrg		memset(&execbuf, 0, sizeof(execbuf));
144863ef14f0Smrg		execbuf.buffers_ptr = (uintptr_t)&object;
144963ef14f0Smrg		execbuf.buffer_count = 1;
145063ef14f0Smrg		execbuf.flags = KGEM_BLT;
145163ef14f0Smrg
145263ef14f0Smrg		ret = do_ioctl(kgem->fd,
145363ef14f0Smrg			       DRM_IOCTL_I915_GEM_EXECBUFFER2,
145463ef14f0Smrg			       &execbuf);
145563ef14f0Smrg	}
145663ef14f0Smrg	gem_close(kgem->fd, object.handle);
145763ef14f0Smrg
145863ef14f0Smrg	return ret == 0;
145903b705cfSriastradh}
146003b705cfSriastradh
146163ef14f0Smrgstatic bool gem_set_tiling(int fd, uint32_t handle, int tiling, int stride)
146203b705cfSriastradh{
146363ef14f0Smrg	struct drm_i915_gem_set_tiling set_tiling;
146463ef14f0Smrg
146563ef14f0Smrg	if (DBG_NO_TILING)
146603b705cfSriastradh		return false;
146703b705cfSriastradh
146863ef14f0Smrg	VG_CLEAR(set_tiling);
146963ef14f0Smrg	set_tiling.handle = handle;
147063ef14f0Smrg	set_tiling.tiling_mode = tiling;
147163ef14f0Smrg	set_tiling.stride = stride;
147263ef14f0Smrg
147363ef14f0Smrg	if (ioctl(fd, DRM_IOCTL_I915_GEM_SET_TILING, &set_tiling) == 0)
147463ef14f0Smrg		return set_tiling.tiling_mode == tiling;
147563ef14f0Smrg
147663ef14f0Smrg	return false;
147703b705cfSriastradh}
147803b705cfSriastradh
147963ef14f0Smrgstatic bool test_can_scanout_y(struct kgem *kgem)
148003b705cfSriastradh{
148163ef14f0Smrg	struct drm_mode_fb_cmd arg;
148263ef14f0Smrg	bool ret = false;
148363ef14f0Smrg
148463ef14f0Smrg	if (DBG_NO_SCANOUT_Y)
148563ef14f0Smrg		return false;
148663ef14f0Smrg
148763ef14f0Smrg	VG_CLEAR(arg);
148863ef14f0Smrg	arg.width = 32;
148963ef14f0Smrg	arg.height = 32;
149063ef14f0Smrg	arg.pitch = 4*32;
149163ef14f0Smrg	arg.bpp = 32;
149263ef14f0Smrg	arg.depth = 24;
149363ef14f0Smrg	arg.handle = gem_create(kgem->fd, 1);
149463ef14f0Smrg
149563ef14f0Smrg	if (gem_set_tiling(kgem->fd, arg.handle, I915_TILING_Y, arg.pitch))
149663ef14f0Smrg		ret = do_ioctl(kgem->fd, DRM_IOCTL_MODE_ADDFB, &arg) == 0;
149763ef14f0Smrg	if (!ret) {
149863ef14f0Smrg		struct local_mode_fb_cmd2 {
149963ef14f0Smrg			uint32_t fb_id;
150063ef14f0Smrg			uint32_t width, height;
150163ef14f0Smrg			uint32_t pixel_format;
150263ef14f0Smrg			uint32_t flags;
150363ef14f0Smrg
150463ef14f0Smrg			uint32_t handles[4];
150563ef14f0Smrg			uint32_t pitches[4];
150663ef14f0Smrg			uint32_t offsets[4];
150763ef14f0Smrg			uint64_t modifiers[4];
150863ef14f0Smrg		} f;
150963ef14f0Smrg#define LOCAL_IOCTL_MODE_ADDFB2 DRM_IOWR(0xb8, struct local_mode_fb_cmd2)
151063ef14f0Smrg		memset(&f, 0, sizeof(f));
151163ef14f0Smrg		f.width = arg.width;
151263ef14f0Smrg		f.height = arg.height;
151363ef14f0Smrg		f.handles[0] = arg.handle;
151463ef14f0Smrg		f.pitches[0] = arg.pitch;
151563ef14f0Smrg		f.modifiers[0] = (uint64_t)1 << 56 | 2; /* MOD_Y_TILED */
151663ef14f0Smrg		f.pixel_format = 'X' | 'R' << 8 | '2' << 16 | '4' << 24; /* XRGB8888 */
151763ef14f0Smrg		f.flags = 1 << 1; /* + modifier */
151863ef14f0Smrg		if (drmIoctl(kgem->fd, LOCAL_IOCTL_MODE_ADDFB2, &f) == 0) {
151963ef14f0Smrg			ret = true;
152063ef14f0Smrg			arg.fb_id = f.fb_id;
152163ef14f0Smrg		}
152263ef14f0Smrg	}
152363ef14f0Smrg	do_ioctl(kgem->fd, DRM_IOCTL_MODE_RMFB, &arg.fb_id);
152463ef14f0Smrg	gem_close(kgem->fd, arg.handle);
152563ef14f0Smrg
152663ef14f0Smrg	return ret;
152703b705cfSriastradh}
152803b705cfSriastradh
152963ef14f0Smrgstatic bool test_has_dirtyfb(struct kgem *kgem)
15309a906b70Schristos{
153163ef14f0Smrg	struct drm_mode_fb_cmd create;
153263ef14f0Smrg	bool ret = false;
15339a906b70Schristos
153463ef14f0Smrg	if (DBG_NO_DIRTYFB)
153563ef14f0Smrg		return false;
15369a906b70Schristos
153763ef14f0Smrg	VG_CLEAR(create);
153863ef14f0Smrg	create.width = 32;
153963ef14f0Smrg	create.height = 32;
154063ef14f0Smrg	create.pitch = 4*32;
154163ef14f0Smrg	create.bpp = 24;
154263ef14f0Smrg	create.depth = 32; /* {bpp:24, depth:32} -> x8r8g8b8 */
154363ef14f0Smrg	create.handle = gem_create(kgem->fd, 1);
154463ef14f0Smrg	if (create.handle == 0)
154563ef14f0Smrg		return false;
15469a906b70Schristos
154763ef14f0Smrg	if (drmIoctl(kgem->fd, DRM_IOCTL_MODE_ADDFB, &create) == 0) {
154863ef14f0Smrg		struct drm_mode_fb_dirty_cmd dirty;
154963ef14f0Smrg
155063ef14f0Smrg		memset(&dirty, 0, sizeof(dirty));
155163ef14f0Smrg		dirty.fb_id = create.fb_id;
155263ef14f0Smrg		ret = drmIoctl(kgem->fd,
155363ef14f0Smrg			       DRM_IOCTL_MODE_DIRTYFB,
155463ef14f0Smrg			       &dirty) == 0;
155563ef14f0Smrg
155663ef14f0Smrg		/* XXX There may be multiple levels of DIRTYFB, depending on
155763ef14f0Smrg		 * whether the kernel thinks tracking dirty regions is
155863ef14f0Smrg		 * beneficial vs flagging the whole fb as dirty.
155963ef14f0Smrg		 */
156063ef14f0Smrg
156163ef14f0Smrg		drmIoctl(kgem->fd,
156263ef14f0Smrg			 DRM_IOCTL_MODE_RMFB,
156363ef14f0Smrg			 &create.fb_id);
15649a906b70Schristos	}
156563ef14f0Smrg	gem_close(kgem->fd, create.handle);
15669a906b70Schristos
156763ef14f0Smrg	return ret;
15689a906b70Schristos}
15699a906b70Schristos
157063ef14f0Smrgstatic bool test_has_secure_batches(struct kgem *kgem)
15719a906b70Schristos{
157263ef14f0Smrg	if (DBG_NO_SECURE_BATCHES)
157363ef14f0Smrg		return false;
15749a906b70Schristos
157563ef14f0Smrg	return gem_param(kgem, LOCAL_I915_PARAM_HAS_SECURE_BATCHES) > 0;
157663ef14f0Smrg}
15779a906b70Schristos
157863ef14f0Smrgstatic bool test_has_pinned_batches(struct kgem *kgem)
157963ef14f0Smrg{
158063ef14f0Smrg	if (DBG_NO_PINNED_BATCHES)
158163ef14f0Smrg		return false;
15829a906b70Schristos
158363ef14f0Smrg	return gem_param(kgem, LOCAL_I915_PARAM_HAS_PINNED_BATCHES) > 0;
15849a906b70Schristos}
15859a906b70Schristos
158603b705cfSriastradhstatic bool kgem_init_pinned_batches(struct kgem *kgem)
158703b705cfSriastradh{
158803b705cfSriastradh	int count[2] = { 16, 4 };
158903b705cfSriastradh	int size[2] = { 1, 4 };
159063ef14f0Smrg	int ret = 0;
159103b705cfSriastradh	int n, i;
159203b705cfSriastradh
159363ef14f0Smrg	if (unlikely(kgem->wedged))
159403b705cfSriastradh		return true;
159503b705cfSriastradh
159603b705cfSriastradh	for (n = 0; n < ARRAY_SIZE(count); n++) {
159703b705cfSriastradh		for (i = 0; i < count[n]; i++) {
159803b705cfSriastradh			struct drm_i915_gem_pin pin;
159903b705cfSriastradh			struct kgem_bo *bo;
160003b705cfSriastradh
160103b705cfSriastradh			VG_CLEAR(pin);
160203b705cfSriastradh
160303b705cfSriastradh			pin.handle = gem_create(kgem->fd, size[n]);
160403b705cfSriastradh			if (pin.handle == 0)
160503b705cfSriastradh				goto err;
160603b705cfSriastradh
160703b705cfSriastradh			DBG(("%s: new handle=%d, num_pages=%d\n",
160803b705cfSriastradh			     __FUNCTION__, pin.handle, size[n]));
160903b705cfSriastradh
161003b705cfSriastradh			bo = __kgem_bo_alloc(pin.handle, size[n]);
161103b705cfSriastradh			if (bo == NULL) {
161203b705cfSriastradh				gem_close(kgem->fd, pin.handle);
161303b705cfSriastradh				goto err;
161403b705cfSriastradh			}
161503b705cfSriastradh
161603b705cfSriastradh			pin.alignment = 0;
161763ef14f0Smrg			ret = do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_PIN, &pin);
161863ef14f0Smrg			if (ret) {
161903b705cfSriastradh				gem_close(kgem->fd, pin.handle);
16209a906b70Schristos				free(bo);
162103b705cfSriastradh				goto err;
162203b705cfSriastradh			}
162303b705cfSriastradh			bo->presumed_offset = pin.offset;
162403b705cfSriastradh			debug_alloc__bo(kgem, bo);
162503b705cfSriastradh			list_add(&bo->list, &kgem->pinned_batches[n]);
162603b705cfSriastradh		}
162703b705cfSriastradh	}
162803b705cfSriastradh
162903b705cfSriastradh	return true;
163003b705cfSriastradh
163103b705cfSriastradherr:
163203b705cfSriastradh	for (n = 0; n < ARRAY_SIZE(kgem->pinned_batches); n++) {
163303b705cfSriastradh		while (!list_is_empty(&kgem->pinned_batches[n])) {
163403b705cfSriastradh			kgem_bo_destroy(kgem,
163503b705cfSriastradh					list_first_entry(&kgem->pinned_batches[n],
163603b705cfSriastradh							 struct kgem_bo, list));
163703b705cfSriastradh		}
163803b705cfSriastradh	}
163903b705cfSriastradh
164063ef14f0Smrg	/* If we fail to pin some memory for 830gm/845g, we need to disable
164163ef14f0Smrg	 * acceleration as otherwise the machine will eventually fail. However,
164263ef14f0Smrg	 * the kernel started arbitrarily rejecting PIN, so hope for the best
164363ef14f0Smrg	 * if the ioctl no longer works.
164463ef14f0Smrg	 */
164563ef14f0Smrg	if (ret != -ENODEV && kgem->gen == 020)
164663ef14f0Smrg		return false;
164763ef14f0Smrg
164863ef14f0Smrg	kgem->has_pinned_batches = false;
164963ef14f0Smrg
165003b705cfSriastradh	/* For simplicity populate the lists with a single unpinned bo */
165103b705cfSriastradh	for (n = 0; n < ARRAY_SIZE(count); n++) {
165203b705cfSriastradh		struct kgem_bo *bo;
165303b705cfSriastradh		uint32_t handle;
165403b705cfSriastradh
165503b705cfSriastradh		handle = gem_create(kgem->fd, size[n]);
165603b705cfSriastradh		if (handle == 0)
165763ef14f0Smrg			return false;
165803b705cfSriastradh
165903b705cfSriastradh		bo = __kgem_bo_alloc(handle, size[n]);
166003b705cfSriastradh		if (bo == NULL) {
166103b705cfSriastradh			gem_close(kgem->fd, handle);
166263ef14f0Smrg			return false;
166303b705cfSriastradh		}
166403b705cfSriastradh
166503b705cfSriastradh		debug_alloc__bo(kgem, bo);
166603b705cfSriastradh		list_add(&bo->list, &kgem->pinned_batches[n]);
166703b705cfSriastradh	}
166863ef14f0Smrg	return true;
166903b705cfSriastradh}
167003b705cfSriastradh
167103b705cfSriastradhstatic void kgem_init_swizzling(struct kgem *kgem)
167203b705cfSriastradh{
1673813957e3Ssnj	struct local_i915_gem_get_tiling_v2 {
1674813957e3Ssnj		uint32_t handle;
1675813957e3Ssnj		uint32_t tiling_mode;
1676813957e3Ssnj		uint32_t swizzle_mode;
1677813957e3Ssnj		uint32_t phys_swizzle_mode;
1678813957e3Ssnj	} tiling;
1679813957e3Ssnj#define LOCAL_IOCTL_I915_GEM_GET_TILING DRM_IOWR (DRM_COMMAND_BASE + DRM_I915_GEM_GET_TILING, struct local_i915_gem_get_tiling_v2)
168003b705cfSriastradh
168163ef14f0Smrg	memset(&tiling, 0, sizeof(tiling));
168203b705cfSriastradh	tiling.handle = gem_create(kgem->fd, 1);
168303b705cfSriastradh	if (!tiling.handle)
168403b705cfSriastradh		return;
168503b705cfSriastradh
168603b705cfSriastradh	if (!gem_set_tiling(kgem->fd, tiling.handle, I915_TILING_X, 512))
168703b705cfSriastradh		goto out;
168803b705cfSriastradh
1689813957e3Ssnj	if (do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_GET_TILING, &tiling))
1690813957e3Ssnj		goto out;
1691813957e3Ssnj
169263ef14f0Smrg	DBG(("%s: swizzle_mode=%d, phys_swizzle_mode=%d\n",
169363ef14f0Smrg	     __FUNCTION__, tiling.swizzle_mode, tiling.phys_swizzle_mode));
169463ef14f0Smrg
169563ef14f0Smrg	kgem->can_fence =
169663ef14f0Smrg		!DBG_NO_TILING &&
169763ef14f0Smrg		tiling.swizzle_mode != I915_BIT_6_SWIZZLE_UNKNOWN;
169863ef14f0Smrg
169963ef14f0Smrg	if (kgem->gen < 050 && tiling.phys_swizzle_mode != tiling.swizzle_mode)
170003b705cfSriastradh		goto out;
170103b705cfSriastradh
170263ef14f0Smrg	if (!DBG_NO_DETILING)
170363ef14f0Smrg		choose_memcpy_tiled_x(kgem,
170463ef14f0Smrg				      tiling.swizzle_mode,
170563ef14f0Smrg				      __to_sna(kgem)->cpu_features);
170603b705cfSriastradhout:
170703b705cfSriastradh	gem_close(kgem->fd, tiling.handle);
170863ef14f0Smrg	DBG(("%s: can fence?=%d\n", __FUNCTION__, kgem->can_fence));
170903b705cfSriastradh}
171003b705cfSriastradh
1711813957e3Ssnjstatic void kgem_fixup_relocs(struct kgem *kgem, struct kgem_bo *bo, int shrink)
1712813957e3Ssnj{
1713813957e3Ssnj	int n;
1714813957e3Ssnj
1715813957e3Ssnj	bo->target_handle = kgem->has_handle_lut ? kgem->nexec : bo->handle;
1716813957e3Ssnj
1717813957e3Ssnj	assert(kgem->nreloc__self <= 256);
1718813957e3Ssnj	if (kgem->nreloc__self == 0)
1719813957e3Ssnj		return;
1720813957e3Ssnj
1721813957e3Ssnj	DBG(("%s: fixing up %d%s self-relocations to handle=%p, presumed-offset=%llx\n",
1722813957e3Ssnj	     __FUNCTION__, kgem->nreloc__self,
1723813957e3Ssnj	     kgem->nreloc__self == 256 ? "+" : "",
1724813957e3Ssnj	     bo->handle, (long long)bo->presumed_offset));
1725813957e3Ssnj	for (n = 0; n < kgem->nreloc__self; n++) {
1726813957e3Ssnj		int i = kgem->reloc__self[n];
172763ef14f0Smrg		uint64_t addr;
1728813957e3Ssnj
1729813957e3Ssnj		assert(kgem->reloc[i].target_handle == ~0U);
1730813957e3Ssnj		kgem->reloc[i].target_handle = bo->target_handle;
1731813957e3Ssnj		kgem->reloc[i].presumed_offset = bo->presumed_offset;
1732813957e3Ssnj
1733813957e3Ssnj		if (kgem->reloc[i].read_domains == I915_GEM_DOMAIN_INSTRUCTION) {
1734813957e3Ssnj			DBG(("%s: moving base of self-reloc[%d:%d] %d -> %d\n",
1735813957e3Ssnj			     __FUNCTION__, n, i,
1736813957e3Ssnj			     kgem->reloc[i].delta,
1737813957e3Ssnj			     kgem->reloc[i].delta - shrink));
1738813957e3Ssnj
1739813957e3Ssnj			kgem->reloc[i].delta -= shrink;
1740813957e3Ssnj		}
174163ef14f0Smrg		addr = (int)kgem->reloc[i].delta + bo->presumed_offset;
174263ef14f0Smrg		kgem->batch[kgem->reloc[i].offset/sizeof(uint32_t)] = addr;
174363ef14f0Smrg		if (kgem->gen >= 0100)
174463ef14f0Smrg			kgem->batch[kgem->reloc[i].offset/sizeof(uint32_t) + 1] = addr >> 32;
1745813957e3Ssnj	}
1746813957e3Ssnj
1747813957e3Ssnj	if (n == 256) {
1748813957e3Ssnj		for (n = kgem->reloc__self[255]; n < kgem->nreloc; n++) {
1749813957e3Ssnj			if (kgem->reloc[n].target_handle == ~0U) {
175063ef14f0Smrg				uint64_t addr;
175163ef14f0Smrg
1752813957e3Ssnj				kgem->reloc[n].target_handle = bo->target_handle;
1753813957e3Ssnj				kgem->reloc[n].presumed_offset = bo->presumed_offset;
1754813957e3Ssnj
1755813957e3Ssnj				if (kgem->reloc[n].read_domains == I915_GEM_DOMAIN_INSTRUCTION) {
1756813957e3Ssnj					DBG(("%s: moving base of reloc[%d] %d -> %d\n",
1757813957e3Ssnj					     __FUNCTION__, n,
1758813957e3Ssnj					     kgem->reloc[n].delta,
1759813957e3Ssnj					     kgem->reloc[n].delta - shrink));
1760813957e3Ssnj					kgem->reloc[n].delta -= shrink;
1761813957e3Ssnj				}
176263ef14f0Smrg
176363ef14f0Smrg				addr = (int)kgem->reloc[n].delta + bo->presumed_offset;
176463ef14f0Smrg				kgem->batch[kgem->reloc[n].offset/sizeof(uint32_t)] = addr;
176563ef14f0Smrg				if (kgem->gen >= 0100)
176663ef14f0Smrg					kgem->batch[kgem->reloc[n].offset/sizeof(uint32_t) + 1] = addr >> 32;
1767813957e3Ssnj			}
1768813957e3Ssnj		}
1769813957e3Ssnj	}
1770813957e3Ssnj
1771813957e3Ssnj	if (shrink) {
1772813957e3Ssnj		DBG(("%s: shrinking by %d\n", __FUNCTION__, shrink));
1773813957e3Ssnj		for (n = 0; n < kgem->nreloc; n++) {
1774813957e3Ssnj			if (kgem->reloc[n].offset >= sizeof(uint32_t)*kgem->nbatch)
1775813957e3Ssnj				kgem->reloc[n].offset -= shrink;
1776813957e3Ssnj		}
1777813957e3Ssnj	}
1778813957e3Ssnj}
1779813957e3Ssnj
178063ef14f0Smrgstatic int kgem_bo_wait(struct kgem *kgem, struct kgem_bo *bo)
178163ef14f0Smrg{
178263ef14f0Smrg	struct local_i915_gem_wait {
178363ef14f0Smrg		uint32_t handle;
178463ef14f0Smrg		uint32_t flags;
178563ef14f0Smrg		int64_t timeout;
178663ef14f0Smrg	} wait;
178763ef14f0Smrg#define LOCAL_I915_GEM_WAIT       0x2c
178863ef14f0Smrg#define LOCAL_IOCTL_I915_GEM_WAIT         DRM_IOWR(DRM_COMMAND_BASE + LOCAL_I915_GEM_WAIT, struct local_i915_gem_wait)
178963ef14f0Smrg	int ret;
179063ef14f0Smrg
179163ef14f0Smrg	DBG(("%s: waiting for handle=%d\n", __FUNCTION__, bo->handle));
179263ef14f0Smrg	if (bo->rq == NULL)
179363ef14f0Smrg		return 0;
179463ef14f0Smrg
179563ef14f0Smrg	VG_CLEAR(wait);
179663ef14f0Smrg	wait.handle = bo->handle;
179763ef14f0Smrg	wait.flags = 0;
179863ef14f0Smrg	wait.timeout = -1;
179963ef14f0Smrg	ret = do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_WAIT, &wait);
180063ef14f0Smrg	if (ret) {
180163ef14f0Smrg		struct drm_i915_gem_set_domain set_domain;
180263ef14f0Smrg
180363ef14f0Smrg		VG_CLEAR(set_domain);
180463ef14f0Smrg		set_domain.handle = bo->handle;
180563ef14f0Smrg		set_domain.read_domains = I915_GEM_DOMAIN_GTT;
180663ef14f0Smrg		set_domain.write_domain = I915_GEM_DOMAIN_GTT;
180763ef14f0Smrg		ret = do_ioctl(kgem->fd,
180863ef14f0Smrg			       DRM_IOCTL_I915_GEM_SET_DOMAIN,
180963ef14f0Smrg			       &set_domain);
181063ef14f0Smrg	}
181163ef14f0Smrg
181263ef14f0Smrg	if (ret == 0)
181363ef14f0Smrg		__kgem_retire_requests_upto(kgem, bo);
181463ef14f0Smrg
181563ef14f0Smrg	return ret;
181663ef14f0Smrg}
181763ef14f0Smrg
1818813957e3Ssnjstatic struct kgem_bo *kgem_new_batch(struct kgem *kgem)
1819813957e3Ssnj{
1820813957e3Ssnj	struct kgem_bo *last;
1821813957e3Ssnj	unsigned flags;
1822813957e3Ssnj
1823813957e3Ssnj	last = kgem->batch_bo;
1824813957e3Ssnj	if (last) {
1825813957e3Ssnj		kgem_fixup_relocs(kgem, last, 0);
1826813957e3Ssnj		kgem->batch = NULL;
1827813957e3Ssnj	}
1828813957e3Ssnj
1829813957e3Ssnj	if (kgem->batch) {
1830813957e3Ssnj		assert(last == NULL);
1831813957e3Ssnj		return NULL;
1832813957e3Ssnj	}
1833813957e3Ssnj
1834813957e3Ssnj	flags = CREATE_CPU_MAP | CREATE_NO_THROTTLE;
1835813957e3Ssnj	if (!kgem->has_llc)
1836813957e3Ssnj		flags |= CREATE_UNCACHED;
1837813957e3Ssnj
183863ef14f0Smrgrestart:
1839813957e3Ssnj	kgem->batch_bo = kgem_create_linear(kgem,
1840813957e3Ssnj					    sizeof(uint32_t)*kgem->batch_size,
1841813957e3Ssnj					    flags);
1842813957e3Ssnj	if (kgem->batch_bo)
1843813957e3Ssnj		kgem->batch = kgem_bo_map__cpu(kgem, kgem->batch_bo);
1844813957e3Ssnj	if (kgem->batch == NULL) {
184563ef14f0Smrg		int ring = kgem->ring == KGEM_BLT;
184663ef14f0Smrg		assert(ring < ARRAY_SIZE(kgem->requests));
184763ef14f0Smrg
1848813957e3Ssnj		if (kgem->batch_bo) {
1849813957e3Ssnj			kgem_bo_destroy(kgem, kgem->batch_bo);
1850813957e3Ssnj			kgem->batch_bo = NULL;
1851813957e3Ssnj		}
1852813957e3Ssnj
185363ef14f0Smrg		if (!list_is_empty(&kgem->requests[ring])) {
185463ef14f0Smrg			struct kgem_request *rq;
185563ef14f0Smrg
185663ef14f0Smrg			rq = list_first_entry(&kgem->requests[ring],
185763ef14f0Smrg					      struct kgem_request, list);
185863ef14f0Smrg			assert(rq->ring == ring);
185963ef14f0Smrg			assert(rq->bo);
186063ef14f0Smrg			assert(RQ(rq->bo->rq) == rq);
186163ef14f0Smrg			if (kgem_bo_wait(kgem, rq->bo) == 0)
186263ef14f0Smrg				goto restart;
186363ef14f0Smrg		}
186463ef14f0Smrg
186563ef14f0Smrg		if (flags & CREATE_NO_THROTTLE) {
186663ef14f0Smrg			flags &= ~CREATE_NO_THROTTLE;
186763ef14f0Smrg			if (kgem_cleanup_cache(kgem))
186863ef14f0Smrg				goto restart;
186963ef14f0Smrg		}
187063ef14f0Smrg
187163ef14f0Smrg		DBG(("%s: unable to map batch bo, mallocing(size=%d)\n",
187263ef14f0Smrg		     __FUNCTION__, sizeof(uint32_t)*kgem->batch_size));
1873813957e3Ssnj		if (posix_memalign((void **)&kgem->batch, PAGE_SIZE,
1874813957e3Ssnj				   ALIGN(sizeof(uint32_t) * kgem->batch_size, PAGE_SIZE))) {
1875813957e3Ssnj			ERR(("%s: batch allocation failed, disabling acceleration\n", __FUNCTION__));
1876813957e3Ssnj			__kgem_set_wedged(kgem);
1877813957e3Ssnj		}
1878813957e3Ssnj	} else {
1879813957e3Ssnj		DBG(("%s: allocated and mapped batch handle=%d [size=%d]\n",
1880813957e3Ssnj		     __FUNCTION__, kgem->batch_bo->handle,
1881813957e3Ssnj		     sizeof(uint32_t)*kgem->batch_size));
1882813957e3Ssnj		kgem_bo_sync__cpu(kgem, kgem->batch_bo);
1883813957e3Ssnj	}
1884813957e3Ssnj
1885813957e3Ssnj	DBG(("%s: using last batch handle=%d\n",
1886813957e3Ssnj	     __FUNCTION__, last ? last->handle : 0));
1887813957e3Ssnj	return last;
1888813957e3Ssnj}
188903b705cfSriastradh
/* Retire hook that does nothing; the argument is deliberately ignored. */
static void no_retire(struct kgem *kgem)
{
	(void)kgem;
}
189563ef14f0Smrg
/* Expire hook that does nothing; the argument is deliberately ignored. */
static void no_expire(struct kgem *kgem)
{
	(void)kgem;
}
190163ef14f0Smrg
/* Context-switch hook that does nothing; both arguments are ignored. */
static void no_context_switch(struct kgem *kgem, int new_mode)
{
	(void)new_mode;
	(void)kgem;
}
190863ef14f0Smrg
190963ef14f0Smrgstatic uint64_t get_gtt_size(int fd)
191003b705cfSriastradh{
191103b705cfSriastradh	struct drm_i915_gem_get_aperture aperture;
191263ef14f0Smrg	struct local_i915_gem_context_param {
191363ef14f0Smrg		uint32_t context;
191463ef14f0Smrg		uint32_t size;
191563ef14f0Smrg		uint64_t param;
191663ef14f0Smrg#define LOCAL_CONTEXT_PARAM_BAN_PERIOD	0x1
191763ef14f0Smrg#define LOCAL_CONTEXT_PARAM_NO_ZEROMAP	0x2
191863ef14f0Smrg#define LOCAL_CONTEXT_PARAM_GTT_SIZE	0x3
191963ef14f0Smrg		uint64_t value;
192063ef14f0Smrg	} p;
192163ef14f0Smrg#define LOCAL_I915_GEM_CONTEXT_GETPARAM       0x34
192263ef14f0Smrg#define LOCAL_IOCTL_I915_GEM_CONTEXT_GETPARAM DRM_IOWR (DRM_COMMAND_BASE + LOCAL_I915_GEM_CONTEXT_GETPARAM, struct local_i915_gem_context_param)
192363ef14f0Smrg
192463ef14f0Smrg	memset(&aperture, 0, sizeof(aperture));
192563ef14f0Smrg
192663ef14f0Smrg	memset(&p, 0, sizeof(p));
192763ef14f0Smrg	p.param = LOCAL_CONTEXT_PARAM_GTT_SIZE;
192863ef14f0Smrg	if (drmIoctl(fd, LOCAL_IOCTL_I915_GEM_CONTEXT_GETPARAM, &p) == 0)
192963ef14f0Smrg		aperture.aper_size = p.value;
193063ef14f0Smrg	if (aperture.aper_size == 0)
193163ef14f0Smrg		(void)drmIoctl(fd, DRM_IOCTL_I915_GEM_GET_APERTURE, &aperture);
193263ef14f0Smrg	if (aperture.aper_size == 0)
193363ef14f0Smrg		aperture.aper_size = 64*1024*1024;
193463ef14f0Smrg
193563ef14f0Smrg	DBG(("%s: aperture size %lld, available now %lld\n",
193663ef14f0Smrg	     __FUNCTION__,
193763ef14f0Smrg	     (long long)aperture.aper_size,
193863ef14f0Smrg	     (long long)aperture.aper_available_size));
193963ef14f0Smrg
194063ef14f0Smrg	/* clamp aperture to uint32_t for simplicity */
194163ef14f0Smrg	if (aperture.aper_size > 0xc0000000)
194263ef14f0Smrg		aperture.aper_size = 0xc0000000;
194363ef14f0Smrg
194463ef14f0Smrg	return aperture.aper_size;
194563ef14f0Smrg}
194663ef14f0Smrg
194763ef14f0Smrgvoid kgem_init(struct kgem *kgem, int fd, struct pci_device *dev, unsigned gen)
194863ef14f0Smrg{
194903b705cfSriastradh	size_t totalram;
195003b705cfSriastradh	unsigned half_gpu_max;
195103b705cfSriastradh	unsigned int i, j;
195263ef14f0Smrg	uint64_t gtt_size;
195303b705cfSriastradh
195403b705cfSriastradh	DBG(("%s: fd=%d, gen=%d\n", __FUNCTION__, fd, gen));
195503b705cfSriastradh
195603b705cfSriastradh	kgem->fd = fd;
195703b705cfSriastradh	kgem->gen = gen;
195803b705cfSriastradh
195963ef14f0Smrg	kgem->retire = no_retire;
196063ef14f0Smrg	kgem->expire = no_expire;
196163ef14f0Smrg	kgem->context_switch = no_context_switch;
196263ef14f0Smrg
196303b705cfSriastradh	list_init(&kgem->requests[0]);
196403b705cfSriastradh	list_init(&kgem->requests[1]);
196503b705cfSriastradh	list_init(&kgem->batch_buffers);
196603b705cfSriastradh	list_init(&kgem->active_buffers);
196703b705cfSriastradh	list_init(&kgem->flushing);
196803b705cfSriastradh	list_init(&kgem->large);
196903b705cfSriastradh	list_init(&kgem->large_inactive);
197003b705cfSriastradh	list_init(&kgem->snoop);
197103b705cfSriastradh	list_init(&kgem->scanout);
197203b705cfSriastradh	for (i = 0; i < ARRAY_SIZE(kgem->pinned_batches); i++)
197303b705cfSriastradh		list_init(&kgem->pinned_batches[i]);
197403b705cfSriastradh	for (i = 0; i < ARRAY_SIZE(kgem->inactive); i++)
197503b705cfSriastradh		list_init(&kgem->inactive[i]);
197603b705cfSriastradh	for (i = 0; i < ARRAY_SIZE(kgem->active); i++) {
197703b705cfSriastradh		for (j = 0; j < ARRAY_SIZE(kgem->active[i]); j++)
197803b705cfSriastradh			list_init(&kgem->active[i][j]);
197903b705cfSriastradh	}
198003b705cfSriastradh	for (i = 0; i < ARRAY_SIZE(kgem->vma); i++) {
198103b705cfSriastradh		for (j = 0; j < ARRAY_SIZE(kgem->vma[i].inactive); j++)
198203b705cfSriastradh			list_init(&kgem->vma[i].inactive[j]);
198303b705cfSriastradh	}
198403b705cfSriastradh	kgem->vma[MAP_GTT].count = -MAX_GTT_VMA_CACHE;
198503b705cfSriastradh	kgem->vma[MAP_CPU].count = -MAX_CPU_VMA_CACHE;
198603b705cfSriastradh
198703b705cfSriastradh	kgem->has_blt = gem_param(kgem, LOCAL_I915_PARAM_HAS_BLT) > 0;
198803b705cfSriastradh	DBG(("%s: has BLT ring? %d\n", __FUNCTION__,
198903b705cfSriastradh	     kgem->has_blt));
199003b705cfSriastradh
199103b705cfSriastradh	kgem->has_relaxed_delta =
199203b705cfSriastradh		gem_param(kgem, LOCAL_I915_PARAM_HAS_RELAXED_DELTA) > 0;
199303b705cfSriastradh	DBG(("%s: has relaxed delta? %d\n", __FUNCTION__,
199403b705cfSriastradh	     kgem->has_relaxed_delta));
199503b705cfSriastradh
199603b705cfSriastradh	kgem->has_relaxed_fencing = test_has_relaxed_fencing(kgem);
199703b705cfSriastradh	DBG(("%s: has relaxed fencing? %d\n", __FUNCTION__,
199803b705cfSriastradh	     kgem->has_relaxed_fencing));
199903b705cfSriastradh
200063ef14f0Smrg	kgem->has_coherent_mmap_gtt = test_has_coherent_mmap_gtt(kgem);
200163ef14f0Smrg	DBG(("%s: has coherent writes into GTT maps? %d\n", __FUNCTION__,
200263ef14f0Smrg	     kgem->has_coherent_mmap_gtt));
200363ef14f0Smrg
200403b705cfSriastradh	kgem->has_llc = test_has_llc(kgem);
200503b705cfSriastradh	DBG(("%s: has shared last-level-cache? %d\n", __FUNCTION__,
200603b705cfSriastradh	     kgem->has_llc));
200703b705cfSriastradh
200803b705cfSriastradh	kgem->has_wt = test_has_wt(kgem);
200903b705cfSriastradh	DBG(("%s: has write-through caching for scanouts? %d\n", __FUNCTION__,
201003b705cfSriastradh	     kgem->has_wt));
201103b705cfSriastradh
2012813957e3Ssnj	kgem->has_wc_mmap = test_has_wc_mmap(kgem);
2013813957e3Ssnj	DBG(("%s: has wc-mmapping? %d\n", __FUNCTION__,
2014813957e3Ssnj	     kgem->has_wc_mmap));
2015813957e3Ssnj
201603b705cfSriastradh	kgem->has_caching = test_has_caching(kgem);
201703b705cfSriastradh	DBG(("%s: has set-cache-level? %d\n", __FUNCTION__,
201803b705cfSriastradh	     kgem->has_caching));
201903b705cfSriastradh
202003b705cfSriastradh	kgem->has_userptr = test_has_userptr(kgem);
202103b705cfSriastradh	DBG(("%s: has userptr? %d\n", __FUNCTION__,
202203b705cfSriastradh	     kgem->has_userptr));
202303b705cfSriastradh
202403b705cfSriastradh	kgem->has_create2 = test_has_create2(kgem);
202503b705cfSriastradh	DBG(("%s: has create2? %d\n", __FUNCTION__,
202603b705cfSriastradh	     kgem->has_create2));
202703b705cfSriastradh
202803b705cfSriastradh	kgem->has_no_reloc = test_has_no_reloc(kgem);
202903b705cfSriastradh	DBG(("%s: has no-reloc? %d\n", __FUNCTION__,
203003b705cfSriastradh	     kgem->has_no_reloc));
203103b705cfSriastradh
203203b705cfSriastradh	kgem->has_handle_lut = test_has_handle_lut(kgem);
203303b705cfSriastradh	DBG(("%s: has handle-lut? %d\n", __FUNCTION__,
203403b705cfSriastradh	     kgem->has_handle_lut));
203503b705cfSriastradh
203603b705cfSriastradh	kgem->has_semaphores = false;
203703b705cfSriastradh	if (kgem->has_blt && test_has_semaphores_enabled(kgem))
203803b705cfSriastradh		kgem->has_semaphores = true;
203903b705cfSriastradh	DBG(("%s: semaphores enabled? %d\n", __FUNCTION__,
204003b705cfSriastradh	     kgem->has_semaphores));
204103b705cfSriastradh
204203b705cfSriastradh	kgem->can_blt_cpu = gen >= 030;
204303b705cfSriastradh	DBG(("%s: can blt to cpu? %d\n", __FUNCTION__,
204403b705cfSriastradh	     kgem->can_blt_cpu));
204503b705cfSriastradh
204663ef14f0Smrg	kgem->can_blt_y = test_can_blt_y(kgem);
204763ef14f0Smrg	DBG(("%s: can blit to Y-tiled surfaces? %d\n", __FUNCTION__,
204863ef14f0Smrg	     kgem->can_blt_y));
204963ef14f0Smrg
20509a906b70Schristos	kgem->can_render_y = gen != 021 && (gen >> 3) != 4;
20519a906b70Schristos	DBG(("%s: can render to Y-tiled surfaces? %d\n", __FUNCTION__,
20529a906b70Schristos	     kgem->can_render_y));
20539a906b70Schristos
205463ef14f0Smrg	kgem->can_scanout_y = test_can_scanout_y(kgem);
205563ef14f0Smrg	DBG(("%s: can scanout Y-tiled surfaces? %d\n", __FUNCTION__,
205663ef14f0Smrg	     kgem->can_scanout_y));
205763ef14f0Smrg
205863ef14f0Smrg	kgem->has_dirtyfb = test_has_dirtyfb(kgem);
205963ef14f0Smrg	DBG(("%s: has dirty fb? %d\n", __FUNCTION__, kgem->has_dirtyfb));
206063ef14f0Smrg
206103b705cfSriastradh	kgem->has_secure_batches = test_has_secure_batches(kgem);
206203b705cfSriastradh	DBG(("%s: can use privileged batchbuffers? %d\n", __FUNCTION__,
206303b705cfSriastradh	     kgem->has_secure_batches));
206403b705cfSriastradh
206503b705cfSriastradh	kgem->has_pinned_batches = test_has_pinned_batches(kgem);
206603b705cfSriastradh	DBG(("%s: can use pinned batchbuffers (to avoid CS w/a)? %d\n", __FUNCTION__,
206703b705cfSriastradh	     kgem->has_pinned_batches));
206803b705cfSriastradh
206903b705cfSriastradh	if (!is_hw_supported(kgem, dev)) {
207003b705cfSriastradh		xf86DrvMsg(kgem_get_screen_index(kgem), X_WARNING,
207103b705cfSriastradh			   "Detected unsupported/dysfunctional hardware, disabling acceleration.\n");
2072813957e3Ssnj		__kgem_set_wedged(kgem);
20739a906b70Schristos	} else if (__kgem_throttle(kgem, false)) {
207403b705cfSriastradh		xf86DrvMsg(kgem_get_screen_index(kgem), X_WARNING,
207503b705cfSriastradh			   "Detected a hung GPU, disabling acceleration.\n");
2076813957e3Ssnj		__kgem_set_wedged(kgem);
207703b705cfSriastradh	}
207803b705cfSriastradh
2079813957e3Ssnj	kgem->batch_size = UINT16_MAX & ~7;
208003b705cfSriastradh	if (gen == 020 && !kgem->has_pinned_batches)
208103b705cfSriastradh		/* Limited to what we can pin */
208203b705cfSriastradh		kgem->batch_size = 4*1024;
208303b705cfSriastradh	if (gen == 022)
208403b705cfSriastradh		/* 865g cannot handle a batch spanning multiple pages */
208503b705cfSriastradh		kgem->batch_size = PAGE_SIZE / sizeof(uint32_t);
20869a906b70Schristos	if (gen >= 070)
208703b705cfSriastradh		kgem->batch_size = 16*1024;
208803b705cfSriastradh	if (!kgem->has_relaxed_delta && kgem->batch_size > 4*1024)
208903b705cfSriastradh		kgem->batch_size = 4*1024;
209003b705cfSriastradh
209163ef14f0Smrg	if (!kgem_init_pinned_batches(kgem)) {
209203b705cfSriastradh		xf86DrvMsg(kgem_get_screen_index(kgem), X_WARNING,
209303b705cfSriastradh			   "Unable to reserve memory for GPU, disabling acceleration.\n");
2094813957e3Ssnj		__kgem_set_wedged(kgem);
209503b705cfSriastradh	}
209603b705cfSriastradh
209703b705cfSriastradh	DBG(("%s: maximum batch size? %d\n", __FUNCTION__,
209803b705cfSriastradh	     kgem->batch_size));
2099813957e3Ssnj	kgem_new_batch(kgem);
210003b705cfSriastradh
210103b705cfSriastradh	kgem->half_cpu_cache_pages = cpu_cache_size() >> 13;
210203b705cfSriastradh	DBG(("%s: last-level cache size: %d bytes, threshold in pages: %d\n",
210303b705cfSriastradh	     __FUNCTION__, cpu_cache_size(), kgem->half_cpu_cache_pages));
210403b705cfSriastradh
210503b705cfSriastradh	kgem->next_request = __kgem_request_alloc(kgem);
210603b705cfSriastradh
210703b705cfSriastradh	DBG(("%s: cpu bo enabled %d: llc? %d, set-cache-level? %d, userptr? %d\n", __FUNCTION__,
210803b705cfSriastradh	     !DBG_NO_CPU && (kgem->has_llc | kgem->has_userptr | kgem->has_caching),
210903b705cfSriastradh	     kgem->has_llc, kgem->has_caching, kgem->has_userptr));
211003b705cfSriastradh
211163ef14f0Smrg	gtt_size = get_gtt_size(fd);
211263ef14f0Smrg	kgem->aperture_total = gtt_size;
211363ef14f0Smrg	kgem->aperture_high = gtt_size * 3/4;
211463ef14f0Smrg	kgem->aperture_low = gtt_size * 1/3;
211503b705cfSriastradh	if (gen < 033) {
211603b705cfSriastradh		/* Severe alignment penalties */
211703b705cfSriastradh		kgem->aperture_high /= 2;
211803b705cfSriastradh		kgem->aperture_low /= 2;
211903b705cfSriastradh	}
212063ef14f0Smrg	DBG(("%s: aperture low=%u [%u], high=%u [%u]\n", __FUNCTION__,
212103b705cfSriastradh	     kgem->aperture_low, kgem->aperture_low / (1024*1024),
212203b705cfSriastradh	     kgem->aperture_high, kgem->aperture_high / (1024*1024)));
212303b705cfSriastradh
21249a906b70Schristos	kgem->aperture_mappable = 256 * 1024 * 1024;
21259a906b70Schristos	if (dev != NULL)
21269a906b70Schristos		kgem->aperture_mappable = agp_aperture_size(dev, gen);
212763ef14f0Smrg	if (kgem->aperture_mappable == 0 || kgem->aperture_mappable > gtt_size)
212863ef14f0Smrg		kgem->aperture_mappable = gtt_size;
212903b705cfSriastradh	DBG(("%s: aperture mappable=%d [%d MiB]\n", __FUNCTION__,
213003b705cfSriastradh	     kgem->aperture_mappable, kgem->aperture_mappable / (1024*1024)));
213103b705cfSriastradh
21329a906b70Schristos	kgem->aperture_fenceable = MIN(256*1024*1024, kgem->aperture_mappable);
21339a906b70Schristos	DBG(("%s: aperture fenceable=%d [%d MiB]\n", __FUNCTION__,
21349a906b70Schristos	     kgem->aperture_fenceable, kgem->aperture_fenceable / (1024*1024)));
21359a906b70Schristos
213603b705cfSriastradh	kgem->buffer_size = 64 * 1024;
213703b705cfSriastradh	while (kgem->buffer_size < kgem->aperture_mappable >> 10)
213803b705cfSriastradh		kgem->buffer_size *= 2;
213903b705cfSriastradh	if (kgem->buffer_size >> 12 > kgem->half_cpu_cache_pages)
214003b705cfSriastradh		kgem->buffer_size = kgem->half_cpu_cache_pages << 12;
214103b705cfSriastradh	kgem->buffer_size = 1 << __fls(kgem->buffer_size);
214203b705cfSriastradh	DBG(("%s: buffer size=%d [%d KiB]\n", __FUNCTION__,
214303b705cfSriastradh	     kgem->buffer_size, kgem->buffer_size / 1024));
214403b705cfSriastradh	assert(kgem->buffer_size);
214503b705cfSriastradh
214603b705cfSriastradh	kgem->max_object_size = 3 * (kgem->aperture_high >> 12) << 10;
214703b705cfSriastradh	kgem->max_gpu_size = kgem->max_object_size;
214803b705cfSriastradh	if (!kgem->has_llc && kgem->max_gpu_size > MAX_CACHE_SIZE)
214903b705cfSriastradh		kgem->max_gpu_size = MAX_CACHE_SIZE;
215003b705cfSriastradh
215103b705cfSriastradh	totalram = total_ram_size();
215203b705cfSriastradh	if (totalram == 0) {
215303b705cfSriastradh		DBG(("%s: total ram size unknown, assuming maximum of total aperture\n",
215403b705cfSriastradh		     __FUNCTION__));
215503b705cfSriastradh		totalram = kgem->aperture_total;
215603b705cfSriastradh	}
215763ef14f0Smrg	DBG(("%s: total ram=%lld\n", __FUNCTION__, (long long)totalram));
215803b705cfSriastradh	if (kgem->max_object_size > totalram / 2)
215903b705cfSriastradh		kgem->max_object_size = totalram / 2;
216003b705cfSriastradh	if (kgem->max_gpu_size > totalram / 4)
216103b705cfSriastradh		kgem->max_gpu_size = totalram / 4;
216203b705cfSriastradh
21639a906b70Schristos	if (kgem->aperture_high > totalram / 2) {
21649a906b70Schristos		kgem->aperture_high = totalram / 2;
21659a906b70Schristos		kgem->aperture_low = kgem->aperture_high / 4;
21669a906b70Schristos		DBG(("%s: reduced aperture watermaks to fit into ram; low=%d [%d], high=%d [%d]\n", __FUNCTION__,
21679a906b70Schristos		     kgem->aperture_low, kgem->aperture_low / (1024*1024),
21689a906b70Schristos		     kgem->aperture_high, kgem->aperture_high / (1024*1024)));
21699a906b70Schristos	}
21709a906b70Schristos
217103b705cfSriastradh	kgem->max_cpu_size = kgem->max_object_size;
217203b705cfSriastradh
217303b705cfSriastradh	half_gpu_max = kgem->max_gpu_size / 2;
217403b705cfSriastradh	kgem->max_copy_tile_size = (MAX_CACHE_SIZE + 1)/2;
217503b705cfSriastradh	if (kgem->max_copy_tile_size > half_gpu_max)
217603b705cfSriastradh		kgem->max_copy_tile_size = half_gpu_max;
217703b705cfSriastradh
217803b705cfSriastradh	if (kgem->has_llc)
217903b705cfSriastradh		kgem->max_upload_tile_size = kgem->max_copy_tile_size;
218003b705cfSriastradh	else
21819a906b70Schristos		kgem->max_upload_tile_size = kgem->aperture_fenceable / 4;
218203b705cfSriastradh	if (kgem->max_upload_tile_size > half_gpu_max)
218303b705cfSriastradh		kgem->max_upload_tile_size = half_gpu_max;
218403b705cfSriastradh	if (kgem->max_upload_tile_size > kgem->aperture_high/2)
218503b705cfSriastradh		kgem->max_upload_tile_size = kgem->aperture_high/2;
218603b705cfSriastradh	if (kgem->max_upload_tile_size > kgem->aperture_low)
218703b705cfSriastradh		kgem->max_upload_tile_size = kgem->aperture_low;
218803b705cfSriastradh	if (kgem->max_upload_tile_size < 16*PAGE_SIZE)
218903b705cfSriastradh		kgem->max_upload_tile_size = 16*PAGE_SIZE;
219003b705cfSriastradh
219103b705cfSriastradh	kgem->large_object_size = MAX_CACHE_SIZE;
219203b705cfSriastradh	if (kgem->large_object_size > half_gpu_max)
219303b705cfSriastradh		kgem->large_object_size = half_gpu_max;
219403b705cfSriastradh	if (kgem->max_copy_tile_size > kgem->aperture_high/2)
219503b705cfSriastradh		kgem->max_copy_tile_size = kgem->aperture_high/2;
219603b705cfSriastradh	if (kgem->max_copy_tile_size > kgem->aperture_low)
219703b705cfSriastradh		kgem->max_copy_tile_size = kgem->aperture_low;
219803b705cfSriastradh	if (kgem->max_copy_tile_size < 16*PAGE_SIZE)
219903b705cfSriastradh		kgem->max_copy_tile_size = 16*PAGE_SIZE;
220003b705cfSriastradh
220103b705cfSriastradh	if (kgem->has_llc | kgem->has_caching | kgem->has_userptr) {
220203b705cfSriastradh		if (kgem->large_object_size > kgem->max_cpu_size)
220303b705cfSriastradh			kgem->large_object_size = kgem->max_cpu_size;
220403b705cfSriastradh	} else
220503b705cfSriastradh		kgem->max_cpu_size = 0;
220603b705cfSriastradh	if (DBG_NO_CPU)
220703b705cfSriastradh		kgem->max_cpu_size = 0;
220803b705cfSriastradh
220963ef14f0Smrg	DBG(("%s: maximum object size=%u\n",
221003b705cfSriastradh	     __FUNCTION__, kgem->max_object_size));
221163ef14f0Smrg	DBG(("%s: large object thresold=%u\n",
221203b705cfSriastradh	     __FUNCTION__, kgem->large_object_size));
221363ef14f0Smrg	DBG(("%s: max object sizes (gpu=%u, cpu=%u, tile upload=%u, copy=%u)\n",
221403b705cfSriastradh	     __FUNCTION__,
221503b705cfSriastradh	     kgem->max_gpu_size, kgem->max_cpu_size,
221603b705cfSriastradh	     kgem->max_upload_tile_size, kgem->max_copy_tile_size));
221703b705cfSriastradh
221803b705cfSriastradh	/* Convert the aperture thresholds to pages */
22199a906b70Schristos	kgem->aperture_mappable /= PAGE_SIZE;
22209a906b70Schristos	kgem->aperture_fenceable /= PAGE_SIZE;
222103b705cfSriastradh	kgem->aperture_low /= PAGE_SIZE;
222203b705cfSriastradh	kgem->aperture_high /= PAGE_SIZE;
22239a906b70Schristos	kgem->aperture_total /= PAGE_SIZE;
222403b705cfSriastradh
222503b705cfSriastradh	kgem->fence_max = gem_param(kgem, I915_PARAM_NUM_FENCES_AVAIL) - 2;
222603b705cfSriastradh	if ((int)kgem->fence_max < 0)
222703b705cfSriastradh		kgem->fence_max = 5; /* minimum safe value for all hw */
222803b705cfSriastradh	DBG(("%s: max fences=%d\n", __FUNCTION__, kgem->fence_max));
222903b705cfSriastradh
223003b705cfSriastradh	kgem->batch_flags_base = 0;
223103b705cfSriastradh	if (kgem->has_no_reloc)
223203b705cfSriastradh		kgem->batch_flags_base |= LOCAL_I915_EXEC_NO_RELOC;
223303b705cfSriastradh	if (kgem->has_handle_lut)
223403b705cfSriastradh		kgem->batch_flags_base |= LOCAL_I915_EXEC_HANDLE_LUT;
223503b705cfSriastradh	if (kgem->has_pinned_batches)
223603b705cfSriastradh		kgem->batch_flags_base |= LOCAL_I915_EXEC_IS_PINNED;
223703b705cfSriastradh
223803b705cfSriastradh	kgem_init_swizzling(kgem);
223903b705cfSriastradh}
224003b705cfSriastradh
224103b705cfSriastradh/* XXX hopefully a good approximation */
22429a906b70Schristosstatic uint32_t kgem_get_unique_id(struct kgem *kgem)
224303b705cfSriastradh{
224403b705cfSriastradh	uint32_t id;
224503b705cfSriastradh	id = ++kgem->unique_id;
224603b705cfSriastradh	if (id == 0)
224703b705cfSriastradh		id = ++kgem->unique_id;
224803b705cfSriastradh	return id;
224903b705cfSriastradh}
225003b705cfSriastradh
225103b705cfSriastradhinline static uint32_t kgem_pitch_alignment(struct kgem *kgem, unsigned flags)
225203b705cfSriastradh{
225303b705cfSriastradh	if (flags & CREATE_PRIME)
225403b705cfSriastradh		return 256;
225503b705cfSriastradh	if (flags & CREATE_SCANOUT)
225603b705cfSriastradh		return 64;
2257813957e3Ssnj	if (kgem->gen >= 0100)
2258813957e3Ssnj		return 32;
22599a906b70Schristos	return 8;
226003b705cfSriastradh}
226103b705cfSriastradh
22629a906b70Schristosvoid kgem_get_tile_size(struct kgem *kgem, int tiling, int pitch,
226303b705cfSriastradh			int *tile_width, int *tile_height, int *tile_size)
226403b705cfSriastradh{
226503b705cfSriastradh	if (kgem->gen <= 030) {
226603b705cfSriastradh		if (tiling) {
226703b705cfSriastradh			if (kgem->gen < 030) {
226803b705cfSriastradh				*tile_width = 128;
226903b705cfSriastradh				*tile_height = 16;
227003b705cfSriastradh				*tile_size = 2048;
227103b705cfSriastradh			} else {
227203b705cfSriastradh				*tile_width = 512;
227303b705cfSriastradh				*tile_height = 8;
227403b705cfSriastradh				*tile_size = 4096;
227503b705cfSriastradh			}
227603b705cfSriastradh		} else {
227703b705cfSriastradh			*tile_width = 1;
227803b705cfSriastradh			*tile_height = 1;
227903b705cfSriastradh			*tile_size = 1;
228003b705cfSriastradh		}
228103b705cfSriastradh	} else switch (tiling) {
228203b705cfSriastradh	default:
228303b705cfSriastradh	case I915_TILING_NONE:
228403b705cfSriastradh		*tile_width = 1;
228503b705cfSriastradh		*tile_height = 1;
228603b705cfSriastradh		*tile_size = 1;
228703b705cfSriastradh		break;
228803b705cfSriastradh	case I915_TILING_X:
228903b705cfSriastradh		*tile_width = 512;
229003b705cfSriastradh		*tile_height = 8;
229103b705cfSriastradh		*tile_size = 4096;
229203b705cfSriastradh		break;
229303b705cfSriastradh	case I915_TILING_Y:
229403b705cfSriastradh		*tile_width = 128;
229503b705cfSriastradh		*tile_height = 32;
229603b705cfSriastradh		*tile_size = 4096;
229703b705cfSriastradh		break;
229803b705cfSriastradh	}
22999a906b70Schristos
23009a906b70Schristos	/* Force offset alignment to tile-row */
23019a906b70Schristos	if (tiling && kgem->gen < 033)
23029a906b70Schristos		*tile_width = pitch;
230303b705cfSriastradh}
230403b705cfSriastradh
230503b705cfSriastradhstatic uint32_t kgem_surface_size(struct kgem *kgem,
230603b705cfSriastradh				  bool relaxed_fencing,
230703b705cfSriastradh				  unsigned flags,
230803b705cfSriastradh				  uint32_t width,
230903b705cfSriastradh				  uint32_t height,
231003b705cfSriastradh				  uint32_t bpp,
231103b705cfSriastradh				  uint32_t tiling,
231203b705cfSriastradh				  uint32_t *pitch)
231303b705cfSriastradh{
231403b705cfSriastradh	uint32_t tile_width, tile_height;
231503b705cfSriastradh	uint32_t size;
231603b705cfSriastradh
231703b705cfSriastradh	assert(width <= MAXSHORT);
231803b705cfSriastradh	assert(height <= MAXSHORT);
231903b705cfSriastradh	assert(bpp >= 8);
232003b705cfSriastradh
232103b705cfSriastradh	if (kgem->gen <= 030) {
232203b705cfSriastradh		if (tiling) {
232303b705cfSriastradh			if (kgem->gen < 030) {
232403b705cfSriastradh				tile_width = 128;
23259a906b70Schristos				tile_height = 16;
232603b705cfSriastradh			} else {
232703b705cfSriastradh				tile_width = 512;
23289a906b70Schristos				tile_height = 8;
232903b705cfSriastradh			}
233003b705cfSriastradh		} else {
233103b705cfSriastradh			tile_width = 2 * bpp >> 3;
233203b705cfSriastradh			tile_width = ALIGN(tile_width,
233303b705cfSriastradh					   kgem_pitch_alignment(kgem, flags));
23349a906b70Schristos			tile_height = 1;
233503b705cfSriastradh		}
233603b705cfSriastradh	} else switch (tiling) {
233703b705cfSriastradh	default:
233803b705cfSriastradh	case I915_TILING_NONE:
233903b705cfSriastradh		tile_width = 2 * bpp >> 3;
234003b705cfSriastradh		tile_width = ALIGN(tile_width,
234103b705cfSriastradh				   kgem_pitch_alignment(kgem, flags));
23429a906b70Schristos		tile_height = 1;
234303b705cfSriastradh		break;
234403b705cfSriastradh
234503b705cfSriastradh	case I915_TILING_X:
234603b705cfSriastradh		tile_width = 512;
23479a906b70Schristos		tile_height = 8;
234803b705cfSriastradh		break;
234903b705cfSriastradh	case I915_TILING_Y:
235003b705cfSriastradh		tile_width = 128;
23519a906b70Schristos		tile_height = 32;
235203b705cfSriastradh		break;
235303b705cfSriastradh	}
23549a906b70Schristos	/* XXX align to an even tile row */
23559a906b70Schristos	if (!kgem->has_relaxed_fencing)
23569a906b70Schristos		tile_height *= 2;
235703b705cfSriastradh
235803b705cfSriastradh	*pitch = ALIGN(width * bpp / 8, tile_width);
235903b705cfSriastradh	height = ALIGN(height, tile_height);
23609a906b70Schristos	DBG(("%s: tile_width=%d, tile_height=%d => aligned pitch=%d, height=%d\n",
23619a906b70Schristos	     __FUNCTION__, tile_width, tile_height, *pitch, height));
23629a906b70Schristos
236303b705cfSriastradh	if (kgem->gen >= 040)
236403b705cfSriastradh		return PAGE_ALIGN(*pitch * height);
236503b705cfSriastradh
236603b705cfSriastradh	/* If it is too wide for the blitter, don't even bother.  */
236703b705cfSriastradh	if (tiling != I915_TILING_NONE) {
23689a906b70Schristos		if (*pitch > 8192) {
23699a906b70Schristos			DBG(("%s: too wide for tiled surface (pitch=%d, limit=%d)\n",
23709a906b70Schristos			     __FUNCTION__, *pitch, 8192));
237103b705cfSriastradh			return 0;
23729a906b70Schristos		}
237303b705cfSriastradh
237403b705cfSriastradh		for (size = tile_width; size < *pitch; size <<= 1)
237503b705cfSriastradh			;
237603b705cfSriastradh		*pitch = size;
237703b705cfSriastradh	} else {
23789a906b70Schristos		if (*pitch >= 32768) {
23799a906b70Schristos			DBG(("%s: too wide for linear surface (pitch=%d, limit=%d)\n",
23809a906b70Schristos			     __FUNCTION__, *pitch, 32767));
238103b705cfSriastradh			return 0;
23829a906b70Schristos		}
238303b705cfSriastradh	}
238403b705cfSriastradh
238503b705cfSriastradh	size = *pitch * height;
238603b705cfSriastradh	if (relaxed_fencing || tiling == I915_TILING_NONE)
238703b705cfSriastradh		return PAGE_ALIGN(size);
238803b705cfSriastradh
23899a906b70Schristos	/* We need to allocate a pot fence region for a tiled buffer. */
239003b705cfSriastradh	if (kgem->gen < 030)
239103b705cfSriastradh		tile_width = 512 * 1024;
239203b705cfSriastradh	else
239303b705cfSriastradh		tile_width = 1024 * 1024;
239403b705cfSriastradh	while (tile_width < size)
239503b705cfSriastradh		tile_width *= 2;
239603b705cfSriastradh	return tile_width;
239703b705cfSriastradh}
239803b705cfSriastradh
23999a906b70Schristosbool kgem_check_surface_size(struct kgem *kgem,
24009a906b70Schristos			     uint32_t width,
24019a906b70Schristos			     uint32_t height,
24029a906b70Schristos			     uint32_t bpp,
24039a906b70Schristos			     uint32_t tiling,
24049a906b70Schristos			     uint32_t pitch,
24059a906b70Schristos			     uint32_t size)
24069a906b70Schristos{
24079a906b70Schristos	uint32_t min_size, min_pitch;
24089a906b70Schristos	int tile_width, tile_height, tile_size;
24099a906b70Schristos
24109a906b70Schristos	DBG(("%s(width=%d, height=%d, bpp=%d, tiling=%d, pitch=%d, size=%d)\n",
24119a906b70Schristos	     __FUNCTION__, width, height, bpp, tiling, pitch, size));
24129a906b70Schristos
24139a906b70Schristos	if (pitch & 3)
24149a906b70Schristos		return false;
24159a906b70Schristos
24169a906b70Schristos	min_size = kgem_surface_size(kgem, kgem->has_relaxed_fencing, 0,
24179a906b70Schristos				     width, height, bpp, tiling,
24189a906b70Schristos				     &min_pitch);
24199a906b70Schristos
24209a906b70Schristos	DBG(("%s: min_pitch=%d, min_size=%d\n", __FUNCTION__, min_pitch, min_size));
24219a906b70Schristos
24229a906b70Schristos	if (size < min_size)
24239a906b70Schristos		return false;
24249a906b70Schristos
24259a906b70Schristos	if (pitch < min_pitch)
24269a906b70Schristos		return false;
24279a906b70Schristos
24289a906b70Schristos	kgem_get_tile_size(kgem, tiling, min_pitch,
24299a906b70Schristos			   &tile_width, &tile_height, &tile_size);
24309a906b70Schristos
24319a906b70Schristos	DBG(("%s: tile_width=%d, tile_size=%d\n", __FUNCTION__, tile_width, tile_size));
24329a906b70Schristos	if (pitch & (tile_width - 1))
24339a906b70Schristos		return false;
24349a906b70Schristos	if (size & (tile_size - 1))
24359a906b70Schristos		return false;
24369a906b70Schristos
24379a906b70Schristos	return true;
24389a906b70Schristos}
24399a906b70Schristos
244003b705cfSriastradhstatic uint32_t kgem_aligned_height(struct kgem *kgem,
244103b705cfSriastradh				    uint32_t height, uint32_t tiling)
244203b705cfSriastradh{
244303b705cfSriastradh	uint32_t tile_height;
244403b705cfSriastradh
244503b705cfSriastradh	if (kgem->gen <= 030) {
24469a906b70Schristos		tile_height = tiling ? kgem->gen < 030 ? 16 : 8 : 1;
244703b705cfSriastradh	} else switch (tiling) {
244803b705cfSriastradh		/* XXX align to an even tile row */
244903b705cfSriastradh	default:
245003b705cfSriastradh	case I915_TILING_NONE:
245103b705cfSriastradh		tile_height = 1;
245203b705cfSriastradh		break;
245303b705cfSriastradh	case I915_TILING_X:
24549a906b70Schristos		tile_height = 8;
245503b705cfSriastradh		break;
245603b705cfSriastradh	case I915_TILING_Y:
24579a906b70Schristos		tile_height = 32;
245803b705cfSriastradh		break;
245903b705cfSriastradh	}
246003b705cfSriastradh
24619a906b70Schristos	/* XXX align to an even tile row */
24629a906b70Schristos	if (!kgem->has_relaxed_fencing)
24639a906b70Schristos		tile_height *= 2;
24649a906b70Schristos
246503b705cfSriastradh	return ALIGN(height, tile_height);
246603b705cfSriastradh}
246703b705cfSriastradh
246803b705cfSriastradhstatic struct drm_i915_gem_exec_object2 *
246903b705cfSriastradhkgem_add_handle(struct kgem *kgem, struct kgem_bo *bo)
247003b705cfSriastradh{
247103b705cfSriastradh	struct drm_i915_gem_exec_object2 *exec;
247203b705cfSriastradh
247303b705cfSriastradh	DBG(("%s: handle=%d, index=%d\n",
247403b705cfSriastradh	     __FUNCTION__, bo->handle, kgem->nexec));
247503b705cfSriastradh
247603b705cfSriastradh	assert(kgem->nexec < ARRAY_SIZE(kgem->exec));
247703b705cfSriastradh	bo->target_handle = kgem->has_handle_lut ? kgem->nexec : bo->handle;
247803b705cfSriastradh	exec = memset(&kgem->exec[kgem->nexec++], 0, sizeof(*exec));
247903b705cfSriastradh	exec->handle = bo->handle;
248003b705cfSriastradh	exec->offset = bo->presumed_offset;
248103b705cfSriastradh
248203b705cfSriastradh	kgem->aperture += num_pages(bo);
248303b705cfSriastradh
248403b705cfSriastradh	return exec;
248503b705cfSriastradh}
248603b705cfSriastradh
248703b705cfSriastradhstatic void kgem_add_bo(struct kgem *kgem, struct kgem_bo *bo)
248803b705cfSriastradh{
24899a906b70Schristos	assert(bo->refcnt);
24909a906b70Schristos	assert(bo->proxy == NULL);
24919a906b70Schristos
249203b705cfSriastradh	bo->exec = kgem_add_handle(kgem, bo);
249303b705cfSriastradh	bo->rq = MAKE_REQUEST(kgem->next_request, kgem->ring);
249403b705cfSriastradh
249503b705cfSriastradh	list_move_tail(&bo->request, &kgem->next_request->buffers);
24969a906b70Schristos	if (bo->io && !list_is_empty(&bo->list))
24979a906b70Schristos		list_move(&bo->list, &kgem->batch_buffers);
249803b705cfSriastradh
249903b705cfSriastradh	/* XXX is it worth working around gcc here? */
250003b705cfSriastradh	kgem->flush |= bo->flush;
250103b705cfSriastradh}
250203b705cfSriastradh
250363ef14f0Smrgstatic void kgem_clear_swctrl(struct kgem *kgem)
250463ef14f0Smrg{
250563ef14f0Smrg	uint32_t *b;
250663ef14f0Smrg
250763ef14f0Smrg	if (kgem->bcs_state == 0)
250863ef14f0Smrg		return;
250963ef14f0Smrg
251063ef14f0Smrg	DBG(("%s: clearin SWCTRL LRI from %x\n",
251163ef14f0Smrg	     __FUNCTION__, kgem->bcs_state));
251263ef14f0Smrg
251363ef14f0Smrg	b = kgem->batch + kgem->nbatch;
251463ef14f0Smrg	kgem->nbatch += 7;
251563ef14f0Smrg
251663ef14f0Smrg	*b++ = MI_FLUSH_DW;
251763ef14f0Smrg	*b++ = 0;
251863ef14f0Smrg	*b++ = 0;
251963ef14f0Smrg	*b++ = 0;
252063ef14f0Smrg
252163ef14f0Smrg	*b++ = MI_LOAD_REGISTER_IMM;
252263ef14f0Smrg	*b++ = BCS_SWCTRL;
252363ef14f0Smrg	*b++ = (BCS_SRC_Y | BCS_DST_Y) << 16;
252463ef14f0Smrg
252563ef14f0Smrg	kgem->bcs_state = 0;
252663ef14f0Smrg}
252763ef14f0Smrg
252803b705cfSriastradhstatic uint32_t kgem_end_batch(struct kgem *kgem)
252903b705cfSriastradh{
253063ef14f0Smrg	kgem_clear_swctrl(kgem);
253103b705cfSriastradh	kgem->batch[kgem->nbatch++] = MI_BATCH_BUFFER_END;
253203b705cfSriastradh	if (kgem->nbatch & 1)
253303b705cfSriastradh		kgem->batch[kgem->nbatch++] = MI_NOOP;
253403b705cfSriastradh
253503b705cfSriastradh	return kgem->nbatch;
253603b705cfSriastradh}
253703b705cfSriastradh
253803b705cfSriastradhstatic void kgem_bo_binding_free(struct kgem *kgem, struct kgem_bo *bo)
253903b705cfSriastradh{
254003b705cfSriastradh	struct kgem_bo_binding *b;
254103b705cfSriastradh
254203b705cfSriastradh	b = bo->binding.next;
254303b705cfSriastradh	while (b) {
254403b705cfSriastradh		struct kgem_bo_binding *next = b->next;
25459a906b70Schristos		free(b);
254603b705cfSriastradh		b = next;
254703b705cfSriastradh	}
254803b705cfSriastradh}
254903b705cfSriastradh
255003b705cfSriastradhstatic void kgem_bo_free(struct kgem *kgem, struct kgem_bo *bo)
255103b705cfSriastradh{
25529a906b70Schristos	DBG(("%s: handle=%d, size=%d\n", __FUNCTION__, bo->handle, bytes(bo)));
255303b705cfSriastradh	assert(bo->refcnt == 0);
255403b705cfSriastradh	assert(bo->proxy == NULL);
255503b705cfSriastradh	assert(bo->exec == NULL);
255603b705cfSriastradh	assert(!bo->snoop || bo->rq == NULL);
255703b705cfSriastradh
255803b705cfSriastradh#ifdef DEBUG_MEMORY
255903b705cfSriastradh	kgem->debug_memory.bo_allocs--;
256003b705cfSriastradh	kgem->debug_memory.bo_bytes -= bytes(bo);
256103b705cfSriastradh#endif
256203b705cfSriastradh
256303b705cfSriastradh	kgem_bo_binding_free(kgem, bo);
25649a906b70Schristos	kgem_bo_rmfb(kgem, bo);
256503b705cfSriastradh
25669a906b70Schristos	if (IS_USER_MAP(bo->map__cpu)) {
256703b705cfSriastradh		assert(bo->rq == NULL);
256803b705cfSriastradh		assert(!__kgem_busy(kgem, bo->handle));
25699a906b70Schristos		assert(MAP(bo->map__cpu) != bo || bo->io || bo->flush);
257003b705cfSriastradh		if (!(bo->io || bo->flush)) {
257103b705cfSriastradh			DBG(("%s: freeing snooped base\n", __FUNCTION__));
25729a906b70Schristos			assert(bo != MAP(bo->map__cpu));
25739a906b70Schristos			free(MAP(bo->map__cpu));
257403b705cfSriastradh		}
25759a906b70Schristos		bo->map__cpu = NULL;
25769a906b70Schristos	}
25779a906b70Schristos
25789a906b70Schristos	DBG(("%s: releasing %p:%p vma for handle=%d, count=%d\n",
25799a906b70Schristos	     __FUNCTION__, bo->map__gtt, bo->map__cpu,
2580813957e3Ssnj	     bo->handle, list_is_empty(&bo->vma) ? 0 : kgem->vma[bo->map__gtt == NULL && bo->map__wc == NULL].count));
25819a906b70Schristos
25829a906b70Schristos	if (!list_is_empty(&bo->vma)) {
25839a906b70Schristos		_list_del(&bo->vma);
2584813957e3Ssnj		kgem->vma[bo->map__gtt == NULL && bo->map__wc == NULL].count--;
258503b705cfSriastradh	}
25869a906b70Schristos
25879a906b70Schristos	if (bo->map__gtt)
2588813957e3Ssnj		munmap(bo->map__gtt, bytes(bo));
2589813957e3Ssnj	if (bo->map__wc) {
2590813957e3Ssnj		VG(VALGRIND_MAKE_MEM_NOACCESS(bo->map__wc, bytes(bo)));
2591813957e3Ssnj		munmap(bo->map__wc, bytes(bo));
2592813957e3Ssnj	}
2593813957e3Ssnj	if (bo->map__cpu) {
2594813957e3Ssnj		VG(VALGRIND_MAKE_MEM_NOACCESS(MAP(bo->map__cpu), bytes(bo)));
25959a906b70Schristos		munmap(MAP(bo->map__cpu), bytes(bo));
2596813957e3Ssnj	}
259703b705cfSriastradh
259803b705cfSriastradh	_list_del(&bo->list);
259903b705cfSriastradh	_list_del(&bo->request);
260003b705cfSriastradh	gem_close(kgem->fd, bo->handle);
260103b705cfSriastradh
26029a906b70Schristos	if (!bo->io && !DBG_NO_MALLOC_CACHE) {
260303b705cfSriastradh		*(struct kgem_bo **)bo = __kgem_freed_bo;
260403b705cfSriastradh		__kgem_freed_bo = bo;
260503b705cfSriastradh	} else
260603b705cfSriastradh		free(bo);
260703b705cfSriastradh}
260803b705cfSriastradh
260903b705cfSriastradhinline static void kgem_bo_move_to_inactive(struct kgem *kgem,
261003b705cfSriastradh					    struct kgem_bo *bo)
261103b705cfSriastradh{
261203b705cfSriastradh	DBG(("%s: moving handle=%d to inactive\n", __FUNCTION__, bo->handle));
261303b705cfSriastradh
261403b705cfSriastradh	assert(bo->refcnt == 0);
261503b705cfSriastradh	assert(bo->reusable);
261603b705cfSriastradh	assert(bo->rq == NULL);
261703b705cfSriastradh	assert(bo->exec == NULL);
261803b705cfSriastradh	assert(bo->domain != DOMAIN_GPU);
261903b705cfSriastradh	assert(!bo->proxy);
262003b705cfSriastradh	assert(!bo->io);
262103b705cfSriastradh	assert(!bo->scanout);
262203b705cfSriastradh	assert(!bo->snoop);
262303b705cfSriastradh	assert(!bo->flush);
262403b705cfSriastradh	assert(!bo->needs_flush);
262563ef14f0Smrg	assert(!bo->delta);
262603b705cfSriastradh	assert(list_is_empty(&bo->vma));
262703b705cfSriastradh	assert_tiling(kgem, bo);
262863ef14f0Smrg	assert_caching(kgem, bo);
262903b705cfSriastradh	ASSERT_IDLE(kgem, bo->handle);
263003b705cfSriastradh
263103b705cfSriastradh	if (bucket(bo) >= NUM_CACHE_BUCKETS) {
26329a906b70Schristos		if (bo->map__gtt) {
263363ef14f0Smrg			DBG(("%s: relinquishing large GTT mapping for handle=%d\n",
263463ef14f0Smrg			     __FUNCTION__, bo->handle));
2635813957e3Ssnj			munmap(bo->map__gtt, bytes(bo));
26369a906b70Schristos			bo->map__gtt = NULL;
26379a906b70Schristos		}
263803b705cfSriastradh
26399a906b70Schristos		list_move(&bo->list, &kgem->large_inactive);
26409a906b70Schristos	} else {
26419a906b70Schristos		assert(bo->flush == false);
2642813957e3Ssnj		assert(list_is_empty(&bo->vma));
26439a906b70Schristos		list_move(&bo->list, &kgem->inactive[bucket(bo)]);
2644813957e3Ssnj		if (bo->map__gtt && !kgem_bo_can_map(kgem, bo)) {
264563ef14f0Smrg			DBG(("%s: relinquishing old GTT mapping for handle=%d\n",
264663ef14f0Smrg			     __FUNCTION__, bo->handle));
2647813957e3Ssnj			munmap(bo->map__gtt, bytes(bo));
2648813957e3Ssnj			bo->map__gtt = NULL;
264903b705cfSriastradh		}
2650813957e3Ssnj		if (bo->map__gtt || (bo->map__wc && !bo->tiling)) {
2651813957e3Ssnj			list_add(&bo->vma, &kgem->vma[0].inactive[bucket(bo)]);
2652813957e3Ssnj			kgem->vma[0].count++;
2653813957e3Ssnj		}
2654813957e3Ssnj		if (bo->map__cpu && list_is_empty(&bo->vma)) {
26559a906b70Schristos			list_add(&bo->vma, &kgem->vma[1].inactive[bucket(bo)]);
26569a906b70Schristos			kgem->vma[1].count++;
265703b705cfSriastradh		}
265803b705cfSriastradh	}
26599a906b70Schristos
26609a906b70Schristos	kgem->need_expire = true;
266103b705cfSriastradh}
266203b705cfSriastradh
266303b705cfSriastradhstatic struct kgem_bo *kgem_bo_replace_io(struct kgem_bo *bo)
266403b705cfSriastradh{
266503b705cfSriastradh	struct kgem_bo *base;
266603b705cfSriastradh
266703b705cfSriastradh	if (!bo->io)
266803b705cfSriastradh		return bo;
266903b705cfSriastradh
267003b705cfSriastradh	assert(!bo->snoop);
267163ef14f0Smrg	assert(!bo->purged);
267263ef14f0Smrg	assert(!bo->scanout);
267363ef14f0Smrg	assert(!bo->delta);
267463ef14f0Smrg
26759a906b70Schristos	if (__kgem_freed_bo) {
26769a906b70Schristos		base = __kgem_freed_bo;
26779a906b70Schristos		__kgem_freed_bo = *(struct kgem_bo **)base;
26789a906b70Schristos	} else
26799a906b70Schristos		base = malloc(sizeof(*base));
268003b705cfSriastradh	if (base) {
268103b705cfSriastradh		DBG(("%s: transferring io handle=%d to bo\n",
268203b705cfSriastradh		     __FUNCTION__, bo->handle));
268303b705cfSriastradh		/* transfer the handle to a minimum bo */
268403b705cfSriastradh		memcpy(base, bo, sizeof(*base));
268503b705cfSriastradh		base->io = false;
268603b705cfSriastradh		list_init(&base->list);
268703b705cfSriastradh		list_replace(&bo->request, &base->request);
268803b705cfSriastradh		list_replace(&bo->vma, &base->vma);
268903b705cfSriastradh		free(bo);
269003b705cfSriastradh		bo = base;
269103b705cfSriastradh	} else
269203b705cfSriastradh		bo->reusable = false;
269303b705cfSriastradh
269403b705cfSriastradh	return bo;
269503b705cfSriastradh}
269603b705cfSriastradh
269703b705cfSriastradhinline static void kgem_bo_remove_from_inactive(struct kgem *kgem,
269803b705cfSriastradh						struct kgem_bo *bo)
269903b705cfSriastradh{
270003b705cfSriastradh	DBG(("%s: removing handle=%d from inactive\n", __FUNCTION__, bo->handle));
270103b705cfSriastradh
270203b705cfSriastradh	list_del(&bo->list);
270303b705cfSriastradh	assert(bo->rq == NULL);
270403b705cfSriastradh	assert(bo->exec == NULL);
270563ef14f0Smrg	assert(!bo->purged);
27069a906b70Schristos	if (!list_is_empty(&bo->vma)) {
2707813957e3Ssnj		assert(bo->map__gtt || bo->map__wc || bo->map__cpu);
270803b705cfSriastradh		list_del(&bo->vma);
2709813957e3Ssnj		kgem->vma[bo->map__gtt == NULL && bo->map__wc == NULL].count--;
271003b705cfSriastradh	}
271103b705cfSriastradh}
271203b705cfSriastradh
271303b705cfSriastradhinline static void kgem_bo_remove_from_active(struct kgem *kgem,
271403b705cfSriastradh					      struct kgem_bo *bo)
271503b705cfSriastradh{
271603b705cfSriastradh	DBG(("%s: removing handle=%d from active\n", __FUNCTION__, bo->handle));
271703b705cfSriastradh
271803b705cfSriastradh	list_del(&bo->list);
271903b705cfSriastradh	assert(bo->rq != NULL);
27209a906b70Schristos	if (RQ(bo->rq) == (void *)kgem) {
27219a906b70Schristos		assert(bo->exec == NULL);
272203b705cfSriastradh		list_del(&bo->request);
27239a906b70Schristos	}
272403b705cfSriastradh	assert(list_is_empty(&bo->vma));
272503b705cfSriastradh}
272603b705cfSriastradh
272703b705cfSriastradhstatic void _kgem_bo_delete_buffer(struct kgem *kgem, struct kgem_bo *bo)
272803b705cfSriastradh{
272903b705cfSriastradh	struct kgem_buffer *io = (struct kgem_buffer *)bo->proxy;
273003b705cfSriastradh
273103b705cfSriastradh	DBG(("%s: size=%d, offset=%d, parent used=%d\n",
273203b705cfSriastradh	     __FUNCTION__, bo->size.bytes, bo->delta, io->used));
273303b705cfSriastradh
273403b705cfSriastradh	if (ALIGN(bo->delta + bo->size.bytes, UPLOAD_ALIGNMENT) == io->used)
273503b705cfSriastradh		io->used = bo->delta;
273603b705cfSriastradh}
273703b705cfSriastradh
273803b705cfSriastradhstatic bool check_scanout_size(struct kgem *kgem,
273903b705cfSriastradh			       struct kgem_bo *bo,
274003b705cfSriastradh			       int width, int height)
274103b705cfSriastradh{
274203b705cfSriastradh	struct drm_mode_fb_cmd info;
274303b705cfSriastradh
274403b705cfSriastradh	assert(bo->scanout);
274503b705cfSriastradh
274603b705cfSriastradh	VG_CLEAR(info);
274703b705cfSriastradh	info.fb_id = bo->delta;
274803b705cfSriastradh
27499a906b70Schristos	if (do_ioctl(kgem->fd, DRM_IOCTL_MODE_GETFB, &info))
275003b705cfSriastradh		return false;
275103b705cfSriastradh
275203b705cfSriastradh	gem_close(kgem->fd, info.handle);
275303b705cfSriastradh
275463ef14f0Smrg	if (width > info.width || height > info.height) {
275503b705cfSriastradh		DBG(("%s: not using scanout %d (%dx%d), want (%dx%d)\n",
275603b705cfSriastradh		     __FUNCTION__,
275703b705cfSriastradh		     info.fb_id, info.width, info.height,
275803b705cfSriastradh		     width, height));
275903b705cfSriastradh		return false;
276003b705cfSriastradh	}
276103b705cfSriastradh
276203b705cfSriastradh	return true;
276303b705cfSriastradh}
276403b705cfSriastradh
276503b705cfSriastradhstatic void kgem_bo_move_to_scanout(struct kgem *kgem, struct kgem_bo *bo)
276603b705cfSriastradh{
276703b705cfSriastradh	assert(bo->refcnt == 0);
276803b705cfSriastradh	assert(bo->scanout);
276903b705cfSriastradh	assert(!bo->flush);
277003b705cfSriastradh	assert(!bo->snoop);
277103b705cfSriastradh	assert(!bo->io);
277203b705cfSriastradh
27739a906b70Schristos	if (bo->purged) { /* for stolen fb */
27749a906b70Schristos		if (!bo->exec) {
27759a906b70Schristos			DBG(("%s: discarding purged scanout - stolen?\n",
27769a906b70Schristos			     __FUNCTION__));
27779a906b70Schristos			kgem_bo_free(kgem, bo);
27789a906b70Schristos		}
277903b705cfSriastradh		return;
278003b705cfSriastradh	}
278103b705cfSriastradh
278203b705cfSriastradh	DBG(("%s: moving %d [fb %d] to scanout cache, active? %d\n",
278303b705cfSriastradh	     __FUNCTION__, bo->handle, bo->delta, bo->rq != NULL));
278403b705cfSriastradh	if (bo->rq)
278503b705cfSriastradh		list_move_tail(&bo->list, &kgem->scanout);
278603b705cfSriastradh	else
278703b705cfSriastradh		list_move(&bo->list, &kgem->scanout);
27889a906b70Schristos
27899a906b70Schristos	kgem->need_expire = true;
279003b705cfSriastradh}
279103b705cfSriastradh
279203b705cfSriastradhstatic void kgem_bo_move_to_snoop(struct kgem *kgem, struct kgem_bo *bo)
279303b705cfSriastradh{
279403b705cfSriastradh	assert(bo->reusable);
27959a906b70Schristos	assert(!bo->scanout);
279603b705cfSriastradh	assert(!bo->flush);
279703b705cfSriastradh	assert(!bo->needs_flush);
279803b705cfSriastradh	assert(bo->refcnt == 0);
279903b705cfSriastradh	assert(bo->exec == NULL);
280063ef14f0Smrg	assert(!bo->purged);
280163ef14f0Smrg	assert(!bo->delta);
280203b705cfSriastradh
28039a906b70Schristos	if (DBG_NO_SNOOP_CACHE) {
28049a906b70Schristos		kgem_bo_free(kgem, bo);
28059a906b70Schristos		return;
28069a906b70Schristos	}
28079a906b70Schristos
280803b705cfSriastradh	if (num_pages(bo) > kgem->max_cpu_size >> 13) {
280903b705cfSriastradh		DBG(("%s handle=%d discarding large CPU buffer (%d >%d pages)\n",
281003b705cfSriastradh		     __FUNCTION__, bo->handle, num_pages(bo), kgem->max_cpu_size >> 13));
281103b705cfSriastradh		kgem_bo_free(kgem, bo);
281203b705cfSriastradh		return;
281303b705cfSriastradh	}
281403b705cfSriastradh
281503b705cfSriastradh	assert(bo->tiling == I915_TILING_NONE);
281603b705cfSriastradh	assert(bo->rq == NULL);
281703b705cfSriastradh
281803b705cfSriastradh	DBG(("%s: moving %d to snoop cachee\n", __FUNCTION__, bo->handle));
281903b705cfSriastradh	list_add(&bo->list, &kgem->snoop);
28209a906b70Schristos	kgem->need_expire = true;
28219a906b70Schristos}
28229a906b70Schristos
28239a906b70Schristosstatic bool kgem_bo_move_to_cache(struct kgem *kgem, struct kgem_bo *bo)
28249a906b70Schristos{
28259a906b70Schristos	bool retired = false;
28269a906b70Schristos
28279a906b70Schristos	DBG(("%s: release handle=%d\n", __FUNCTION__, bo->handle));
28289a906b70Schristos
28299a906b70Schristos	if (bo->prime) {
28309a906b70Schristos		DBG(("%s: discarding imported prime handle=%d\n",
28319a906b70Schristos		     __FUNCTION__, bo->handle));
28329a906b70Schristos		kgem_bo_free(kgem, bo);
28339a906b70Schristos	} else if (bo->snoop) {
28349a906b70Schristos		kgem_bo_move_to_snoop(kgem, bo);
28359a906b70Schristos	} else if (bo->scanout) {
28369a906b70Schristos		kgem_bo_move_to_scanout(kgem, bo);
283763ef14f0Smrg	} else if ((bo = kgem_bo_replace_io(bo))->reusable) {
28389a906b70Schristos		kgem_bo_move_to_inactive(kgem, bo);
28399a906b70Schristos		retired = true;
28409a906b70Schristos	} else
28419a906b70Schristos		kgem_bo_free(kgem, bo);
28429a906b70Schristos
28439a906b70Schristos	return retired;
284403b705cfSriastradh}
284503b705cfSriastradh
284603b705cfSriastradhstatic struct kgem_bo *
284703b705cfSriastradhsearch_snoop_cache(struct kgem *kgem, unsigned int num_pages, unsigned flags)
284803b705cfSriastradh{
284903b705cfSriastradh	struct kgem_bo *bo, *first = NULL;
285003b705cfSriastradh
285103b705cfSriastradh	DBG(("%s: num_pages=%d, flags=%x\n", __FUNCTION__, num_pages, flags));
285203b705cfSriastradh
285303b705cfSriastradh	if ((kgem->has_caching | kgem->has_userptr) == 0)
285403b705cfSriastradh		return NULL;
285503b705cfSriastradh
285603b705cfSriastradh	if (list_is_empty(&kgem->snoop)) {
285703b705cfSriastradh		DBG(("%s: inactive and cache empty\n", __FUNCTION__));
285803b705cfSriastradh		if (!__kgem_throttle_retire(kgem, flags)) {
285903b705cfSriastradh			DBG(("%s: nothing retired\n", __FUNCTION__));
286003b705cfSriastradh			return NULL;
286103b705cfSriastradh		}
286203b705cfSriastradh	}
286303b705cfSriastradh
286403b705cfSriastradh	list_for_each_entry(bo, &kgem->snoop, list) {
286503b705cfSriastradh		assert(bo->refcnt == 0);
286603b705cfSriastradh		assert(bo->snoop);
286703b705cfSriastradh		assert(!bo->scanout);
286803b705cfSriastradh		assert(!bo->purged);
286903b705cfSriastradh		assert(bo->proxy == NULL);
287003b705cfSriastradh		assert(bo->tiling == I915_TILING_NONE);
287103b705cfSriastradh		assert(bo->rq == NULL);
287203b705cfSriastradh		assert(bo->exec == NULL);
287303b705cfSriastradh
287403b705cfSriastradh		if (num_pages > num_pages(bo))
287503b705cfSriastradh			continue;
287603b705cfSriastradh
287703b705cfSriastradh		if (num_pages(bo) > 2*num_pages) {
287803b705cfSriastradh			if (first == NULL)
287903b705cfSriastradh				first = bo;
288003b705cfSriastradh			continue;
288103b705cfSriastradh		}
288203b705cfSriastradh
288303b705cfSriastradh		list_del(&bo->list);
288403b705cfSriastradh		bo->pitch = 0;
288503b705cfSriastradh		bo->delta = 0;
288603b705cfSriastradh
288703b705cfSriastradh		DBG(("  %s: found handle=%d (num_pages=%d) in snoop cache\n",
288803b705cfSriastradh		     __FUNCTION__, bo->handle, num_pages(bo)));
288903b705cfSriastradh		return bo;
289003b705cfSriastradh	}
289103b705cfSriastradh
289203b705cfSriastradh	if (first) {
289303b705cfSriastradh		list_del(&first->list);
289403b705cfSriastradh		first->pitch = 0;
289503b705cfSriastradh		first->delta = 0;
289603b705cfSriastradh
289703b705cfSriastradh		DBG(("  %s: found handle=%d (num_pages=%d) in snoop cache\n",
289803b705cfSriastradh		     __FUNCTION__, first->handle, num_pages(first)));
289903b705cfSriastradh		return first;
290003b705cfSriastradh	}
290103b705cfSriastradh
290203b705cfSriastradh	return NULL;
290303b705cfSriastradh}
290403b705cfSriastradh
290503b705cfSriastradhvoid kgem_bo_undo(struct kgem *kgem, struct kgem_bo *bo)
290603b705cfSriastradh{
290703b705cfSriastradh	if (kgem->nexec != 1 || bo->exec == NULL)
290803b705cfSriastradh		return;
290903b705cfSriastradh
29109a906b70Schristos	assert(bo);
291103b705cfSriastradh	DBG(("%s: only handle in batch, discarding last operations for handle=%d\n",
291203b705cfSriastradh	     __FUNCTION__, bo->handle));
291303b705cfSriastradh
291463ef14f0Smrg	assert(bo->exec == &_kgem_dummy_exec || bo->exec == &kgem->exec[0]);
291503b705cfSriastradh	assert(kgem->exec[0].handle == bo->handle);
291603b705cfSriastradh	assert(RQ(bo->rq) == kgem->next_request);
291703b705cfSriastradh
291803b705cfSriastradh	bo->refcnt++;
291903b705cfSriastradh	kgem_reset(kgem);
292003b705cfSriastradh	bo->refcnt--;
29219a906b70Schristos
29229a906b70Schristos	assert(kgem->nreloc == 0);
29239a906b70Schristos	assert(kgem->nexec == 0);
29249a906b70Schristos	assert(bo->exec == NULL);
292503b705cfSriastradh}
292603b705cfSriastradh
29279a906b70Schristosvoid kgem_bo_pair_undo(struct kgem *kgem, struct kgem_bo *a, struct kgem_bo *b)
292803b705cfSriastradh{
29299a906b70Schristos	if (kgem->nexec > 2)
29309a906b70Schristos		return;
293103b705cfSriastradh
29329a906b70Schristos	if (kgem->nexec == 1) {
29339a906b70Schristos		if (a)
29349a906b70Schristos			kgem_bo_undo(kgem, a);
29359a906b70Schristos		if (b)
29369a906b70Schristos			kgem_bo_undo(kgem, b);
29379a906b70Schristos		return;
29389a906b70Schristos	}
29399a906b70Schristos
29409a906b70Schristos	if (a == NULL || b == NULL)
29419a906b70Schristos		return;
294263ef14f0Smrg	assert(a != b);
29439a906b70Schristos	if (a->exec == NULL || b->exec == NULL)
29449a906b70Schristos		return;
29459a906b70Schristos
294663ef14f0Smrg	DBG(("%s: only handles in batch, discarding last operations for handle=%d (index=%d) and handle=%d (index=%d)\n",
294763ef14f0Smrg	     __FUNCTION__,
294863ef14f0Smrg	     a->handle, a->proxy ? -1 : a->exec - kgem->exec,
294963ef14f0Smrg	     b->handle, b->proxy ? -1 : b->exec - kgem->exec));
29509a906b70Schristos
295163ef14f0Smrg	assert(a->exec == &_kgem_dummy_exec ||
295263ef14f0Smrg	       a->exec == &kgem->exec[0] ||
295363ef14f0Smrg	       a->exec == &kgem->exec[1]);
29549a906b70Schristos	assert(a->handle == kgem->exec[0].handle || a->handle == kgem->exec[1].handle);
29559a906b70Schristos	assert(RQ(a->rq) == kgem->next_request);
295663ef14f0Smrg	assert(b->exec == &_kgem_dummy_exec ||
295763ef14f0Smrg	       b->exec == &kgem->exec[0] ||
295863ef14f0Smrg	       b->exec == &kgem->exec[1]);
29599a906b70Schristos	assert(b->handle == kgem->exec[0].handle || b->handle == kgem->exec[1].handle);
29609a906b70Schristos	assert(RQ(b->rq) == kgem->next_request);
29619a906b70Schristos
29629a906b70Schristos	a->refcnt++;
29639a906b70Schristos	b->refcnt++;
29649a906b70Schristos	kgem_reset(kgem);
29659a906b70Schristos	b->refcnt--;
29669a906b70Schristos	a->refcnt--;
29679a906b70Schristos
29689a906b70Schristos	assert(kgem->nreloc == 0);
29699a906b70Schristos	assert(kgem->nexec == 0);
29709a906b70Schristos	assert(a->exec == NULL);
29719a906b70Schristos	assert(b->exec == NULL);
29729a906b70Schristos}
29739a906b70Schristos
/*
 * Called when the last reference to bo has been dropped (see kgem_bo_unref):
 * decide whether the bo is kept in one of the caches or freed.
 *
 *  - DBG_NO_CACHE builds and prime bos go straight to the destroy path.
 *  - Snooped bos not marked flush are moved to the snoop cache once they
 *    have no request attached; if still busy nothing more is done here.
 *  - Scanout bos are handed to kgem_bo_move_to_scanout().
 *  - Non-reusable bos go to the destroy path.
 *  - Remaining bos that still have a request attached are put on an active
 *    list (or kgem->large); idle ones go to the inactive cache.
 *
 * On the destroy path the bo is only freed when bo->exec is NULL.
 */
29749a906b70Schristosstatic void __kgem_bo_destroy(struct kgem *kgem, struct kgem_bo *bo)
29759a906b70Schristos{
29769a906b70Schristos	DBG(("%s: handle=%d, size=%d\n", __FUNCTION__, bo->handle, bytes(bo)));
29779a906b70Schristos
29789a906b70Schristos	assert(list_is_empty(&bo->list));
297963ef14f0Smrg	assert(list_is_empty(&bo->vma));
29809a906b70Schristos	assert(bo->refcnt == 0);
29819a906b70Schristos	assert(bo->proxy == NULL);
29829a906b70Schristos	assert(bo->active_scanout == 0);
29839a906b70Schristos	assert_tiling(kgem, bo);
29849a906b70Schristos
29859a906b70Schristos	bo->binding.offset = 0;
298603b705cfSriastradh
298703b705cfSriastradh	if (DBG_NO_CACHE)
298803b705cfSriastradh		goto destroy;
298903b705cfSriastradh
29909a906b70Schristos	if (bo->prime)
29919a906b70Schristos		goto destroy;
29929a906b70Schristos
299303b705cfSriastradh	if (bo->snoop && !bo->flush) {
299403b705cfSriastradh		DBG(("%s: handle=%d is snooped\n", __FUNCTION__, bo->handle));
299503b705cfSriastradh		assert(bo->reusable);
299603b705cfSriastradh		assert(list_is_empty(&bo->list));
	/* Not in the current batch and reported idle: drop the busy tracking. */
299703b705cfSriastradh		if (bo->exec == NULL && bo->rq && !__kgem_busy(kgem, bo->handle))
299803b705cfSriastradh			__kgem_bo_clear_busy(bo);
	/* Only a bo with no request attached is moved to the snoop cache here. */
299903b705cfSriastradh		if (bo->rq == NULL)
300003b705cfSriastradh			kgem_bo_move_to_snoop(kgem, bo);
300103b705cfSriastradh		return;
300203b705cfSriastradh	}
	/* The flush flag is kept only when the CPU map is a user map. */
30039a906b70Schristos	if (!IS_USER_MAP(bo->map__cpu))
300403b705cfSriastradh		bo->flush = false;
300503b705cfSriastradh
300603b705cfSriastradh	if (bo->scanout) {
300703b705cfSriastradh		kgem_bo_move_to_scanout(kgem, bo);
300803b705cfSriastradh		return;
300903b705cfSriastradh	}
301003b705cfSriastradh
	/* kgem_bo_replace_io() may return a different bo; continue with it. */
301103b705cfSriastradh	if (bo->io)
301203b705cfSriastradh		bo = kgem_bo_replace_io(bo);
301303b705cfSriastradh	if (!bo->reusable) {
301403b705cfSriastradh		DBG(("%s: handle=%d, not reusable\n",
301503b705cfSriastradh		     __FUNCTION__, bo->handle));
301603b705cfSriastradh		goto destroy;
301703b705cfSriastradh	}
301803b705cfSriastradh
301903b705cfSriastradh	assert(list_is_empty(&bo->vma));
302003b705cfSriastradh	assert(list_is_empty(&bo->list));
302103b705cfSriastradh	assert(bo->flush == false);
302203b705cfSriastradh	assert(bo->snoop == false);
302303b705cfSriastradh	assert(bo->io == false);
302403b705cfSriastradh	assert(bo->scanout == false);
302563ef14f0Smrg	assert_caching(kgem, bo);
302603b705cfSriastradh
	/* If bo is the only object in the pending batch, that batch is discarded. */
302703b705cfSriastradh	kgem_bo_undo(kgem, bo);
302803b705cfSriastradh	assert(bo->refcnt == 0);
302903b705cfSriastradh
303003b705cfSriastradh	if (bo->rq && bo->exec == NULL && !__kgem_busy(kgem, bo->handle))
303103b705cfSriastradh		__kgem_bo_clear_busy(bo);
303203b705cfSriastradh
	/* Still attached to a request: file under the active lists. */
303303b705cfSriastradh	if (bo->rq) {
303403b705cfSriastradh		struct list *cache;
303503b705cfSriastradh
303603b705cfSriastradh		DBG(("%s: handle=%d -> active\n", __FUNCTION__, bo->handle));
303703b705cfSriastradh		if (bucket(bo) < NUM_CACHE_BUCKETS)
303803b705cfSriastradh			cache = &kgem->active[bucket(bo)][bo->tiling];
303903b705cfSriastradh		else
304003b705cfSriastradh			cache = &kgem->large;
304103b705cfSriastradh		list_add(&bo->list, cache);
304203b705cfSriastradh		return;
304303b705cfSriastradh	}
304403b705cfSriastradh
304503b705cfSriastradh	assert(bo->exec == NULL);
304603b705cfSriastradh	assert(list_is_empty(&bo->request));
304703b705cfSriastradh
	/*
	 * Without LLC, a bo left in the CPU domain is destroyed rather than
	 * cached when it has no CPU map or does not fit the bucketed caches.
	 */
30489a906b70Schristos	if (bo->map__cpu == NULL || bucket(bo) >= NUM_CACHE_BUCKETS) {
304903b705cfSriastradh		if (!kgem->has_llc && bo->domain == DOMAIN_CPU)
305003b705cfSriastradh			goto destroy;
305103b705cfSriastradh
305203b705cfSriastradh		DBG(("%s: handle=%d, purged\n",
305303b705cfSriastradh		     __FUNCTION__, bo->handle));
305403b705cfSriastradh	}
305503b705cfSriastradh
305603b705cfSriastradh	kgem_bo_move_to_inactive(kgem, bo);
305703b705cfSriastradh	return;
305803b705cfSriastradh
305903b705cfSriastradhdestroy:
	/* NOTE(review): a bo with exec set is not freed here; presumably it is released after the batch is committed — confirm. */
306003b705cfSriastradh	if (!bo->exec)
306103b705cfSriastradh		kgem_bo_free(kgem, bo);
306203b705cfSriastradh}
306303b705cfSriastradh
306403b705cfSriastradhstatic void kgem_bo_unref(struct kgem *kgem, struct kgem_bo *bo)
306503b705cfSriastradh{
306603b705cfSriastradh	assert(bo->refcnt);
306703b705cfSriastradh	if (--bo->refcnt == 0)
306803b705cfSriastradh		__kgem_bo_destroy(kgem, bo);
306903b705cfSriastradh}
307003b705cfSriastradh
307103b705cfSriastradhstatic void kgem_buffer_release(struct kgem *kgem, struct kgem_buffer *bo)
307203b705cfSriastradh{
30739a906b70Schristos	assert(bo->base.io);
307403b705cfSriastradh	while (!list_is_empty(&bo->base.vma)) {
307503b705cfSriastradh		struct kgem_bo *cached;
307603b705cfSriastradh
307703b705cfSriastradh		cached = list_first_entry(&bo->base.vma, struct kgem_bo, vma);
307803b705cfSriastradh		assert(cached->proxy == &bo->base);
30799a906b70Schristos		assert(cached != &bo->base);
308003b705cfSriastradh		list_del(&cached->vma);
308103b705cfSriastradh
30829a906b70Schristos		assert(*(struct kgem_bo **)cached->map__gtt == cached);
30839a906b70Schristos		*(struct kgem_bo **)cached->map__gtt = NULL;
30849a906b70Schristos		cached->map__gtt = NULL;
308503b705cfSriastradh
308603b705cfSriastradh		kgem_bo_destroy(kgem, cached);
308703b705cfSriastradh	}
308803b705cfSriastradh}
308903b705cfSriastradh
30909a906b70Schristosvoid kgem_retire__buffers(struct kgem *kgem)
309103b705cfSriastradh{
309203b705cfSriastradh	while (!list_is_empty(&kgem->active_buffers)) {
309303b705cfSriastradh		struct kgem_buffer *bo =
309403b705cfSriastradh			list_last_entry(&kgem->active_buffers,
309503b705cfSriastradh					struct kgem_buffer,
309603b705cfSriastradh					base.list);
309703b705cfSriastradh
30989a906b70Schristos		DBG(("%s: handle=%d, busy? %d [%d]\n",
30999a906b70Schristos		     __FUNCTION__, bo->base.handle, bo->base.rq != NULL, bo->base.exec != NULL));
31009a906b70Schristos
31019a906b70Schristos		assert(bo->base.exec == NULL || RQ(bo->base.rq) == kgem->next_request);
310203b705cfSriastradh		if (bo->base.rq)
310303b705cfSriastradh			break;
310403b705cfSriastradh
310503b705cfSriastradh		DBG(("%s: releasing upload cache for handle=%d? %d\n",
310603b705cfSriastradh		     __FUNCTION__, bo->base.handle, !list_is_empty(&bo->base.vma)));
310703b705cfSriastradh		list_del(&bo->base.list);
310803b705cfSriastradh		kgem_buffer_release(kgem, bo);
310903b705cfSriastradh		kgem_bo_unref(kgem, &bo->base);
311003b705cfSriastradh	}
311103b705cfSriastradh}
311203b705cfSriastradh
311303b705cfSriastradhstatic bool kgem_retire__flushing(struct kgem *kgem)
311403b705cfSriastradh{
311503b705cfSriastradh	struct kgem_bo *bo, *next;
311603b705cfSriastradh	bool retired = false;
311703b705cfSriastradh
311803b705cfSriastradh	list_for_each_entry_safe(bo, next, &kgem->flushing, request) {
31199a906b70Schristos		assert(RQ(bo->rq) == (void *)kgem);
312003b705cfSriastradh		assert(bo->exec == NULL);
312103b705cfSriastradh
312203b705cfSriastradh		if (__kgem_busy(kgem, bo->handle))
312303b705cfSriastradh			break;
312403b705cfSriastradh
312503b705cfSriastradh		__kgem_bo_clear_busy(bo);
312603b705cfSriastradh
312703b705cfSriastradh		if (bo->refcnt)
312803b705cfSriastradh			continue;
312903b705cfSriastradh
31309a906b70Schristos		retired |= kgem_bo_move_to_cache(kgem, bo);
313103b705cfSriastradh	}
313203b705cfSriastradh#if HAS_DEBUG_FULL
313303b705cfSriastradh	{
313403b705cfSriastradh		int count = 0;
313503b705cfSriastradh		list_for_each_entry(bo, &kgem->flushing, request)
313603b705cfSriastradh			count++;
313763ef14f0Smrg		DBG(("%s: %d bo on flushing list, retired? %d\n", __FUNCTION__, count, retired));
313803b705cfSriastradh	}
313903b705cfSriastradh#endif
314003b705cfSriastradh
314103b705cfSriastradh	kgem->need_retire |= !list_is_empty(&kgem->flushing);
314203b705cfSriastradh
314303b705cfSriastradh	return retired;
314403b705cfSriastradh}
314503b705cfSriastradh
314663ef14f0Smrgstatic bool __kgem_bo_flush(struct kgem *kgem, struct kgem_bo *bo)
314763ef14f0Smrg{
314863ef14f0Smrg	struct drm_i915_gem_busy busy;
314963ef14f0Smrg
315063ef14f0Smrg	if (!bo->needs_flush)
315163ef14f0Smrg		return false;
315263ef14f0Smrg
315363ef14f0Smrg	bo->needs_flush = false;
315463ef14f0Smrg
315563ef14f0Smrg	VG_CLEAR(busy);
315663ef14f0Smrg	busy.handle = bo->handle;
315763ef14f0Smrg	busy.busy = !kgem->wedged;
315863ef14f0Smrg	(void)do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_BUSY, &busy);
315963ef14f0Smrg	DBG(("%s: handle=%d, busy=%d, wedged=%d\n",
316063ef14f0Smrg	     __FUNCTION__, bo->handle, busy.busy, kgem->wedged));
316163ef14f0Smrg
316263ef14f0Smrg	if (busy.busy == 0)
316363ef14f0Smrg		return false;
316463ef14f0Smrg
316563ef14f0Smrg	DBG(("%s: moving %d to flushing\n",
316663ef14f0Smrg	     __FUNCTION__, bo->handle));
316763ef14f0Smrg	list_add(&bo->request, &kgem->flushing);
316863ef14f0Smrg	bo->rq = MAKE_REQUEST(kgem, !!(busy.busy & ~0x1ffff));
316963ef14f0Smrg	bo->needs_flush = busy.busy & 0xffff;
317063ef14f0Smrg	kgem->need_retire = true;
317163ef14f0Smrg	return true;
317263ef14f0Smrg}
317363ef14f0Smrg
317403b705cfSriastradhstatic bool __kgem_retire_rq(struct kgem *kgem, struct kgem_request *rq)
317503b705cfSriastradh{
317603b705cfSriastradh	bool retired = false;
317703b705cfSriastradh
317803b705cfSriastradh	DBG(("%s: request %d complete\n",
317903b705cfSriastradh	     __FUNCTION__, rq->bo->handle));
31809a906b70Schristos	assert(RQ(rq->bo->rq) == rq);
318163ef14f0Smrg	assert(rq != (struct kgem_request *)kgem);
318263ef14f0Smrg	assert(rq != &kgem->static_request);
318303b705cfSriastradh
3184813957e3Ssnj	if (rq == kgem->fence[rq->ring])
3185813957e3Ssnj		kgem->fence[rq->ring] = NULL;
3186813957e3Ssnj
318703b705cfSriastradh	while (!list_is_empty(&rq->buffers)) {
318803b705cfSriastradh		struct kgem_bo *bo;
318903b705cfSriastradh
319003b705cfSriastradh		bo = list_first_entry(&rq->buffers,
319103b705cfSriastradh				      struct kgem_bo,
319203b705cfSriastradh				      request);
319303b705cfSriastradh
319403b705cfSriastradh		assert(RQ(bo->rq) == rq);
319503b705cfSriastradh		assert(bo->exec == NULL);
319603b705cfSriastradh		assert(bo->domain == DOMAIN_GPU || bo->domain == DOMAIN_NONE);
319703b705cfSriastradh
319803b705cfSriastradh		list_del(&bo->request);
319903b705cfSriastradh
320063ef14f0Smrg		if (unlikely(__kgem_bo_flush(kgem, bo))) {
320163ef14f0Smrg			assert(bo != rq->bo);
320263ef14f0Smrg			DBG(("%s: movied %d to flushing\n",
320303b705cfSriastradh			     __FUNCTION__, bo->handle));
320403b705cfSriastradh			continue;
320503b705cfSriastradh		}
320603b705cfSriastradh
320703b705cfSriastradh		bo->domain = DOMAIN_NONE;
320803b705cfSriastradh		bo->rq = NULL;
320903b705cfSriastradh		if (bo->refcnt)
321003b705cfSriastradh			continue;
321103b705cfSriastradh
32129a906b70Schristos		retired |= kgem_bo_move_to_cache(kgem, bo);
321303b705cfSriastradh	}
321403b705cfSriastradh
321503b705cfSriastradh	assert(rq->bo->rq == NULL);
32169a906b70Schristos	assert(rq->bo->exec == NULL);
321703b705cfSriastradh	assert(list_is_empty(&rq->bo->request));
32189a906b70Schristos	assert(rq->bo->refcnt > 0);
321903b705cfSriastradh
322003b705cfSriastradh	if (--rq->bo->refcnt == 0) {
322163ef14f0Smrg		kgem_bo_move_to_inactive(kgem, rq->bo);
322263ef14f0Smrg		retired = true;
322303b705cfSriastradh	}
322403b705cfSriastradh
322503b705cfSriastradh	__kgem_request_free(rq);
322603b705cfSriastradh	return retired;
322703b705cfSriastradh}
322803b705cfSriastradh
322903b705cfSriastradhstatic bool kgem_retire__requests_ring(struct kgem *kgem, int ring)
323003b705cfSriastradh{
323103b705cfSriastradh	bool retired = false;
323203b705cfSriastradh
323363ef14f0Smrg	assert(ring < ARRAY_SIZE(kgem->requests));
323403b705cfSriastradh	while (!list_is_empty(&kgem->requests[ring])) {
323503b705cfSriastradh		struct kgem_request *rq;
323603b705cfSriastradh
323763ef14f0Smrg		DBG(("%s: retiring ring %d\n", __FUNCTION__, ring));
323863ef14f0Smrg
323903b705cfSriastradh		rq = list_first_entry(&kgem->requests[ring],
324003b705cfSriastradh				      struct kgem_request,
324103b705cfSriastradh				      list);
32429a906b70Schristos		assert(rq->ring == ring);
324363ef14f0Smrg		assert(rq->bo);
324463ef14f0Smrg		assert(RQ(rq->bo->rq) == rq);
324503b705cfSriastradh		if (__kgem_busy(kgem, rq->bo->handle))
324603b705cfSriastradh			break;
324703b705cfSriastradh
324803b705cfSriastradh		retired |= __kgem_retire_rq(kgem, rq);
324903b705cfSriastradh	}
325003b705cfSriastradh
325103b705cfSriastradh#if HAS_DEBUG_FULL
325203b705cfSriastradh	{
325303b705cfSriastradh		struct kgem_bo *bo;
325403b705cfSriastradh		int count = 0;
325503b705cfSriastradh
325603b705cfSriastradh		list_for_each_entry(bo, &kgem->requests[ring], request)
325703b705cfSriastradh			count++;
325803b705cfSriastradh
325903b705cfSriastradh		bo = NULL;
326003b705cfSriastradh		if (!list_is_empty(&kgem->requests[ring]))
326103b705cfSriastradh			bo = list_first_entry(&kgem->requests[ring],
326203b705cfSriastradh					      struct kgem_request,
326303b705cfSriastradh					      list)->bo;
326403b705cfSriastradh
326563ef14f0Smrg		DBG(("%s: ring=%d, %d outstanding requests, oldest=%d, retired? %d\n",
326663ef14f0Smrg		     __FUNCTION__, ring, count, bo ? bo->handle : 0, retired));
326703b705cfSriastradh	}
326803b705cfSriastradh#endif
326903b705cfSriastradh
327003b705cfSriastradh	return retired;
327103b705cfSriastradh}
327203b705cfSriastradh
327303b705cfSriastradhstatic bool kgem_retire__requests(struct kgem *kgem)
327403b705cfSriastradh{
327503b705cfSriastradh	bool retired = false;
327603b705cfSriastradh	int n;
327703b705cfSriastradh
327803b705cfSriastradh	for (n = 0; n < ARRAY_SIZE(kgem->requests); n++) {
327903b705cfSriastradh		retired |= kgem_retire__requests_ring(kgem, n);
328003b705cfSriastradh		kgem->need_retire |= !list_is_empty(&kgem->requests[n]);
328103b705cfSriastradh	}
328203b705cfSriastradh
328303b705cfSriastradh	return retired;
328403b705cfSriastradh}
328503b705cfSriastradh
328603b705cfSriastradhbool kgem_retire(struct kgem *kgem)
328703b705cfSriastradh{
328803b705cfSriastradh	bool retired = false;
328903b705cfSriastradh
32909a906b70Schristos	DBG(("%s, need_retire?=%d\n", __FUNCTION__, kgem->need_retire));
329103b705cfSriastradh
329203b705cfSriastradh	kgem->need_retire = false;
329303b705cfSriastradh
329403b705cfSriastradh	retired |= kgem_retire__flushing(kgem);
329503b705cfSriastradh	retired |= kgem_retire__requests(kgem);
329603b705cfSriastradh
329703b705cfSriastradh	DBG(("%s -- retired=%d, need_retire=%d\n",
329803b705cfSriastradh	     __FUNCTION__, retired, kgem->need_retire));
329903b705cfSriastradh
330003b705cfSriastradh	kgem->retire(kgem);
330103b705cfSriastradh
330203b705cfSriastradh	return retired;
330303b705cfSriastradh}
330403b705cfSriastradh
330503b705cfSriastradhbool __kgem_ring_is_idle(struct kgem *kgem, int ring)
330603b705cfSriastradh{
330703b705cfSriastradh	struct kgem_request *rq;
330803b705cfSriastradh
33099a906b70Schristos	assert(ring < ARRAY_SIZE(kgem->requests));
331003b705cfSriastradh	assert(!list_is_empty(&kgem->requests[ring]));
331103b705cfSriastradh
3312813957e3Ssnj	rq = kgem->fence[ring];
3313813957e3Ssnj	if (rq) {
3314813957e3Ssnj		struct kgem_request *tmp;
3315813957e3Ssnj
3316813957e3Ssnj		if (__kgem_busy(kgem, rq->bo->handle)) {
3317813957e3Ssnj			DBG(("%s: last fence handle=%d still busy\n",
3318813957e3Ssnj			     __FUNCTION__, rq->bo->handle));
3319813957e3Ssnj			return false;
3320813957e3Ssnj		}
3321813957e3Ssnj
3322813957e3Ssnj		do {
3323813957e3Ssnj			tmp = list_first_entry(&kgem->requests[ring],
3324813957e3Ssnj					       struct kgem_request,
3325813957e3Ssnj					       list);
3326813957e3Ssnj			assert(tmp->ring == ring);
3327813957e3Ssnj			__kgem_retire_rq(kgem, tmp);
3328813957e3Ssnj		} while (tmp != rq);
3329813957e3Ssnj
3330813957e3Ssnj		assert(kgem->fence[ring] == NULL);
3331813957e3Ssnj		if (list_is_empty(&kgem->requests[ring]))
3332813957e3Ssnj			return true;
3333813957e3Ssnj	}
3334813957e3Ssnj
333503b705cfSriastradh	rq = list_last_entry(&kgem->requests[ring],
333603b705cfSriastradh			     struct kgem_request, list);
33379a906b70Schristos	assert(rq->ring == ring);
333863ef14f0Smrg	assert(rq->bo);
333963ef14f0Smrg	assert(RQ(rq->bo->rq) == rq);
334003b705cfSriastradh	if (__kgem_busy(kgem, rq->bo->handle)) {
334103b705cfSriastradh		DBG(("%s: last requests handle=%d still busy\n",
334203b705cfSriastradh		     __FUNCTION__, rq->bo->handle));
3343813957e3Ssnj		kgem->fence[ring] = rq;
334403b705cfSriastradh		return false;
334503b705cfSriastradh	}
334603b705cfSriastradh
334703b705cfSriastradh	DBG(("%s: ring=%d idle (handle=%d)\n",
334803b705cfSriastradh	     __FUNCTION__, ring, rq->bo->handle));
334903b705cfSriastradh
3350813957e3Ssnj	while (!list_is_empty(&kgem->requests[ring])) {
3351813957e3Ssnj		rq = list_first_entry(&kgem->requests[ring],
3352813957e3Ssnj				      struct kgem_request,
3353813957e3Ssnj				      list);
3354813957e3Ssnj		assert(rq->ring == ring);
3355813957e3Ssnj		__kgem_retire_rq(kgem, rq);
3356813957e3Ssnj	}
33579a906b70Schristos
335803b705cfSriastradh	return true;
335903b705cfSriastradh}
336003b705cfSriastradh
336163ef14f0Smrgbool __kgem_retire_requests_upto(struct kgem *kgem, struct kgem_bo *bo)
3362813957e3Ssnj{
336363ef14f0Smrg	struct kgem_request * const rq = RQ(bo->rq), *tmp;
336463ef14f0Smrg	struct list *requests = &kgem->requests[rq->ring];
336563ef14f0Smrg
336663ef14f0Smrg	DBG(("%s(handle=%d, ring=%d)\n", __FUNCTION__, bo->handle, rq->ring));
3367813957e3Ssnj
3368813957e3Ssnj	assert(rq != &kgem->static_request);
3369813957e3Ssnj	if (rq == (struct kgem_request *)kgem) {
3370813957e3Ssnj		__kgem_bo_clear_busy(bo);
337163ef14f0Smrg		return false;
3372813957e3Ssnj	}
3373813957e3Ssnj
337463ef14f0Smrg	assert(rq->ring < ARRAY_SIZE(kgem->requests));
3375813957e3Ssnj	do {
3376813957e3Ssnj		tmp = list_first_entry(requests, struct kgem_request, list);
3377813957e3Ssnj		assert(tmp->ring == rq->ring);
3378813957e3Ssnj		__kgem_retire_rq(kgem, tmp);
3379813957e3Ssnj	} while (tmp != rq);
338063ef14f0Smrg
338163ef14f0Smrg	assert(bo->needs_flush || bo->rq == NULL);
338263ef14f0Smrg	assert(bo->needs_flush || list_is_empty(&bo->request));
338363ef14f0Smrg	assert(bo->needs_flush || bo->domain == DOMAIN_NONE);
338463ef14f0Smrg	return bo->rq;
3385813957e3Ssnj}
3386813957e3Ssnj
/*
 * Disabled debugging aid: the #if 0 branch is compiled out and the #else
 * branch replaces the call with an empty macro.
 *
 * When enabled, for each relocation entry it finds the bo on the pending
 * request whose target_handle matches, reads the value back from the batch bo
 * at the relocation offset (8 bytes when kgem->gen >= 0100, otherwise 4) and
 * asserts that it equals the bo's exec offset plus the relocation delta,
 * unless that exec offset is -1.
 */
33879a906b70Schristos#if 0
33889a906b70Schristosstatic void kgem_commit__check_reloc(struct kgem *kgem)
33899a906b70Schristos{
33909a906b70Schristos	struct kgem_request *rq = kgem->next_request;
33919a906b70Schristos	struct kgem_bo *bo;
33929a906b70Schristos	bool has_64bit = kgem->gen >= 0100;
33939a906b70Schristos	int i;
33949a906b70Schristos
33959a906b70Schristos	for (i = 0; i < kgem->nreloc; i++) {
33969a906b70Schristos		list_for_each_entry(bo, &rq->buffers, request) {
33979a906b70Schristos			if (bo->target_handle == kgem->reloc[i].target_handle) {
33989a906b70Schristos				uint64_t value = 0;
33999a906b70Schristos				gem_read(kgem->fd, rq->bo->handle, &value, kgem->reloc[i].offset, has_64bit ? 8 : 4);
34009a906b70Schristos				assert(bo->exec->offset == -1 || value == bo->exec->offset + (int)kgem->reloc[i].delta);
34019a906b70Schristos				break;
34029a906b70Schristos			}
34039a906b70Schristos		}
34049a906b70Schristos	}
34059a906b70Schristos}
34069a906b70Schristos#else
34079a906b70Schristos#define kgem_commit__check_reloc(kgem)
34089a906b70Schristos#endif
34099a906b70Schristos
34109a906b70Schristos#ifndef NDEBUG
34119a906b70Schristosstatic void kgem_commit__check_buffers(struct kgem *kgem)
34129a906b70Schristos{
34139a906b70Schristos	struct kgem_buffer *bo;
34149a906b70Schristos
34159a906b70Schristos	list_for_each_entry(bo, &kgem->active_buffers, base.list)
34169a906b70Schristos		assert(bo->base.exec == NULL);
34179a906b70Schristos}
34189a906b70Schristos#else
34199a906b70Schristos#define kgem_commit__check_buffers(kgem)
34209a906b70Schristos#endif
34219a906b70Schristos
/*
 * Finish the bookkeeping for the request in kgem->next_request.
 *
 * Each bo on the request has its presumed offset recorded and its exec slot
 * cleared. Bos that are unreferenced and not reusable are freed at once; the
 * rest are marked as being in the GPU domain with their dirty flags cleared.
 *
 * If the request is kgem->static_request, the batch is waited upon with a
 * SET_DOMAIN ioctl, its buffers are released immediately, the batch handle
 * is closed and the caches are cleaned up. Otherwise the request is appended
 * to its ring's list of outstanding requests.
 *
 * kgem->next_request is NULL on return.
 */
342203b705cfSriastradhstatic void kgem_commit(struct kgem *kgem)
342303b705cfSriastradh{
342403b705cfSriastradh	struct kgem_request *rq = kgem->next_request;
342503b705cfSriastradh	struct kgem_bo *bo, *next;
342603b705cfSriastradh
34279a906b70Schristos	kgem_commit__check_reloc(kgem);
34289a906b70Schristos
342903b705cfSriastradh	list_for_each_entry_safe(bo, next, &rq->buffers, request) {
343003b705cfSriastradh		assert(next->request.prev == &bo->request);
343103b705cfSriastradh
	/* NOTE(review): this DBG dereferences bo->exec before the assert(bo->exec) below. */
343203b705cfSriastradh		DBG(("%s: release handle=%d (proxy? %d), dirty? %d flush? %d, snoop? %d -> offset=%x\n",
343303b705cfSriastradh		     __FUNCTION__, bo->handle, bo->proxy != NULL,
343403b705cfSriastradh		     bo->gpu_dirty, bo->needs_flush, bo->snoop,
343503b705cfSriastradh		     (unsigned)bo->exec->offset));
343603b705cfSriastradh
343703b705cfSriastradh		assert(bo->exec);
343803b705cfSriastradh		assert(bo->proxy == NULL || bo->exec == &_kgem_dummy_exec);
343903b705cfSriastradh		assert(RQ(bo->rq) == rq || (RQ(bo->proxy->rq) == rq));
344003b705cfSriastradh
	/* Record the exec entry's offset as the presumed offset, then detach the bo from the batch. */
344103b705cfSriastradh		bo->presumed_offset = bo->exec->offset;
344203b705cfSriastradh		bo->exec = NULL;
344303b705cfSriastradh		bo->target_handle = -1;
344403b705cfSriastradh
	/* Nobody holds a reference and the bo cannot be cached: free it now. */
344503b705cfSriastradh		if (!bo->refcnt && !bo->reusable) {
344603b705cfSriastradh			assert(!bo->snoop);
34479a906b70Schristos			assert(!bo->proxy);
344803b705cfSriastradh			kgem_bo_free(kgem, bo);
344903b705cfSriastradh			continue;
345003b705cfSriastradh		}
345103b705cfSriastradh
345203b705cfSriastradh		bo->binding.offset = 0;
345303b705cfSriastradh		bo->domain = DOMAIN_GPU;
345403b705cfSriastradh		bo->gpu_dirty = false;
345563ef14f0Smrg		bo->gtt_dirty = false;
345603b705cfSriastradh
345703b705cfSriastradh		if (bo->proxy) {
345803b705cfSriastradh			/* proxies are not used for domain tracking */
345903b705cfSriastradh			__kgem_bo_clear_busy(bo);
346003b705cfSriastradh		}
346103b705cfSriastradh
34629a906b70Schristos		kgem->scanout_busy |= bo->scanout && bo->needs_flush;
346303b705cfSriastradh	}
346403b705cfSriastradh
	/*
	 * The static request is not queued for later retirement; going by the
	 * DBG below it is the fallback used after an allocation failure.
	 */
346503b705cfSriastradh	if (rq == &kgem->static_request) {
346603b705cfSriastradh		struct drm_i915_gem_set_domain set_domain;
346703b705cfSriastradh
346803b705cfSriastradh		DBG(("%s: syncing due to allocation failure\n", __FUNCTION__));
346903b705cfSriastradh
	/* Move the batch bo to the GTT domain; presumably this blocks until the GPU is done with it. */
347003b705cfSriastradh		VG_CLEAR(set_domain);
347103b705cfSriastradh		set_domain.handle = rq->bo->handle;
347203b705cfSriastradh		set_domain.read_domains = I915_GEM_DOMAIN_GTT;
347303b705cfSriastradh		set_domain.write_domain = I915_GEM_DOMAIN_GTT;
34749a906b70Schristos		if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_DOMAIN, &set_domain)) {
347503b705cfSriastradh			DBG(("%s: sync: GPU hang detected\n", __FUNCTION__));
347603b705cfSriastradh			kgem_throttle(kgem);
347703b705cfSriastradh		}
347803b705cfSriastradh
	/* Detach every bo from the request and destroy those without references. */
347963ef14f0Smrg		while (!list_is_empty(&rq->buffers)) {
348063ef14f0Smrg			bo = list_first_entry(&rq->buffers,
348163ef14f0Smrg					      struct kgem_bo,
348263ef14f0Smrg					      request);
348363ef14f0Smrg
348463ef14f0Smrg			assert(RQ(bo->rq) == rq);
348563ef14f0Smrg			assert(bo->exec == NULL);
348663ef14f0Smrg			assert(bo->domain == DOMAIN_GPU);
348763ef14f0Smrg
348863ef14f0Smrg			list_del(&bo->request);
348963ef14f0Smrg			bo->domain = DOMAIN_NONE;
349063ef14f0Smrg			bo->rq = NULL;
349163ef14f0Smrg
349263ef14f0Smrg			if (bo->refcnt == 0)
349363ef14f0Smrg				_kgem_bo_destroy(kgem, bo);
349463ef14f0Smrg		}
349563ef14f0Smrg
349603b705cfSriastradh		kgem_retire(kgem);
349703b705cfSriastradh		assert(list_is_empty(&rq->buffers));
349803b705cfSriastradh
	/* The batch bo must have no mappings left; its handle is closed directly. */
34999a906b70Schristos		assert(rq->bo->map__gtt == NULL);
3500813957e3Ssnj		assert(rq->bo->map__wc == NULL);
35019a906b70Schristos		assert(rq->bo->map__cpu == NULL);
350203b705cfSriastradh		gem_close(kgem->fd, rq->bo->handle);
350303b705cfSriastradh		kgem_cleanup_cache(kgem);
350403b705cfSriastradh	} else {
350563ef14f0Smrg		assert(rq != (struct kgem_request *)kgem);
35069a906b70Schristos		assert(rq->ring < ARRAY_SIZE(kgem->requests));
350763ef14f0Smrg		assert(rq->bo);
	/* Queue at the tail so each ring's list stays ordered oldest first. */
350803b705cfSriastradh		list_add_tail(&rq->list, &kgem->requests[rq->ring]);
350903b705cfSriastradh		kgem->need_throttle = kgem->need_retire = 1;
3510813957e3Ssnj
	/* Record this request as the ring's fence if none is set and the batch is still busy. */
3511813957e3Ssnj		if (kgem->fence[rq->ring] == NULL &&
3512813957e3Ssnj		    __kgem_busy(kgem, rq->bo->handle))
3513813957e3Ssnj			kgem->fence[rq->ring] = rq;
351403b705cfSriastradh	}
351503b705cfSriastradh
351603b705cfSriastradh	kgem->next_request = NULL;
35179a906b70Schristos
35189a906b70Schristos	kgem_commit__check_buffers(kgem);
351903b705cfSriastradh}
352003b705cfSriastradh
352103b705cfSriastradhstatic void kgem_close_list(struct kgem *kgem, struct list *head)
352203b705cfSriastradh{
352303b705cfSriastradh	while (!list_is_empty(head))
352403b705cfSriastradh		kgem_bo_free(kgem, list_first_entry(head, struct kgem_bo, list));
352503b705cfSriastradh}
352603b705cfSriastradh
352703b705cfSriastradhstatic void kgem_close_inactive(struct kgem *kgem)
352803b705cfSriastradh{
352903b705cfSriastradh	unsigned int i;
353003b705cfSriastradh
353163ef14f0Smrg	for (i = 0; i < ARRAY_SIZE(kgem->inactive); i++) {
353203b705cfSriastradh		kgem_close_list(kgem, &kgem->inactive[i]);
353363ef14f0Smrg		assert(list_is_empty(&kgem->inactive[i]));
353463ef14f0Smrg	}
353503b705cfSriastradh}
353603b705cfSriastradh
353703b705cfSriastradhstatic void kgem_finish_buffers(struct kgem *kgem)
353803b705cfSriastradh{
353903b705cfSriastradh	struct kgem_buffer *bo, *next;
354003b705cfSriastradh
354103b705cfSriastradh	list_for_each_entry_safe(bo, next, &kgem->batch_buffers, base.list) {
35429a906b70Schristos		DBG(("%s: buffer handle=%d, used=%d, exec?=%d, write=%d, mmapped=%s, refcnt=%d\n",
354303b705cfSriastradh		     __FUNCTION__, bo->base.handle, bo->used, bo->base.exec!=NULL,
35449a906b70Schristos		     bo->write, bo->mmapped == MMAPPED_CPU ? "cpu" : bo->mmapped == MMAPPED_GTT ? "gtt" : "no",
35459a906b70Schristos		     bo->base.refcnt));
354603b705cfSriastradh
354703b705cfSriastradh		assert(next->base.list.prev == &bo->base.list);
354803b705cfSriastradh		assert(bo->base.io);
354903b705cfSriastradh		assert(bo->base.refcnt >= 1);
355003b705cfSriastradh
35519a906b70Schristos		if (bo->base.refcnt > 1 && !bo->base.exec) {
35529a906b70Schristos			DBG(("%s: skipping unattached handle=%d, used=%d, refcnt=%d\n",
35539a906b70Schristos			     __FUNCTION__, bo->base.handle, bo->used, bo->base.refcnt));
355403b705cfSriastradh			continue;
355503b705cfSriastradh		}
355603b705cfSriastradh
355703b705cfSriastradh		if (!bo->write) {
355803b705cfSriastradh			assert(bo->base.exec || bo->base.refcnt > 1);
355903b705cfSriastradh			goto decouple;
356003b705cfSriastradh		}
356103b705cfSriastradh
356203b705cfSriastradh		if (bo->mmapped) {
35639a906b70Schristos			uint32_t used;
356403b705cfSriastradh
356503b705cfSriastradh			assert(!bo->need_io);
356603b705cfSriastradh
356703b705cfSriastradh			used = ALIGN(bo->used, PAGE_SIZE);
356803b705cfSriastradh			if (!DBG_NO_UPLOAD_ACTIVE &&
356903b705cfSriastradh			    used + PAGE_SIZE <= bytes(&bo->base) &&
35709a906b70Schristos			    (kgem->has_llc || bo->mmapped == MMAPPED_GTT || bo->base.snoop)) {
35719a906b70Schristos				DBG(("%s: retaining upload buffer (%d/%d): used=%d, refcnt=%d\n",
35729a906b70Schristos				     __FUNCTION__, bo->used, bytes(&bo->base), used, bo->base.refcnt));
357303b705cfSriastradh				bo->used = used;
357403b705cfSriastradh				list_move(&bo->base.list,
357503b705cfSriastradh					  &kgem->active_buffers);
35769a906b70Schristos				kgem->need_retire = true;
357703b705cfSriastradh				continue;
357803b705cfSriastradh			}
357903b705cfSriastradh			DBG(("%s: discarding mmapped buffer, used=%d, map type=%d\n",
35809a906b70Schristos			     __FUNCTION__, bo->used, bo->mmapped));
358103b705cfSriastradh			goto decouple;
358203b705cfSriastradh		}
358303b705cfSriastradh
35849a906b70Schristos		if (!bo->used || !bo->base.exec) {
358503b705cfSriastradh			/* Unless we replace the handle in the execbuffer,
358603b705cfSriastradh			 * then this bo will become active. So decouple it
358703b705cfSriastradh			 * from the buffer list and track it in the normal
358803b705cfSriastradh			 * manner.
358903b705cfSriastradh			 */
359003b705cfSriastradh			goto decouple;
359103b705cfSriastradh		}
359203b705cfSriastradh
359303b705cfSriastradh		assert(bo->need_io);
359403b705cfSriastradh		assert(bo->base.rq == MAKE_REQUEST(kgem->next_request, kgem->ring));
359503b705cfSriastradh		assert(bo->base.domain != DOMAIN_GPU);
359603b705cfSriastradh
359703b705cfSriastradh		if (bo->base.refcnt == 1 &&
359803b705cfSriastradh		    bo->base.size.pages.count > 1 &&
359903b705cfSriastradh		    bo->used < bytes(&bo->base) / 2) {
360003b705cfSriastradh			struct kgem_bo *shrink;
360103b705cfSriastradh			unsigned alloc = NUM_PAGES(bo->used);
360203b705cfSriastradh
360303b705cfSriastradh			shrink = search_snoop_cache(kgem, alloc,
360403b705cfSriastradh						    CREATE_INACTIVE | CREATE_NO_RETIRE);
360503b705cfSriastradh			if (shrink) {
360603b705cfSriastradh				void *map;
360703b705cfSriastradh				int n;
360803b705cfSriastradh
360903b705cfSriastradh				DBG(("%s: used=%d, shrinking %d to %d, handle %d to %d\n",
361003b705cfSriastradh				     __FUNCTION__,
361103b705cfSriastradh				     bo->used, bytes(&bo->base), bytes(shrink),
361203b705cfSriastradh				     bo->base.handle, shrink->handle));
361303b705cfSriastradh
361403b705cfSriastradh				assert(bo->used <= bytes(shrink));
361503b705cfSriastradh				map = kgem_bo_map__cpu(kgem, shrink);
361603b705cfSriastradh				if (map) {
361703b705cfSriastradh					memcpy(map, bo->mem, bo->used);
361803b705cfSriastradh
361903b705cfSriastradh					shrink->target_handle =
362003b705cfSriastradh						kgem->has_handle_lut ? bo->base.target_handle : shrink->handle;
362103b705cfSriastradh					for (n = 0; n < kgem->nreloc; n++) {
362203b705cfSriastradh						if (kgem->reloc[n].target_handle == bo->base.target_handle) {
362363ef14f0Smrg							uint64_t addr = (int)kgem->reloc[n].delta + shrink->presumed_offset;
362463ef14f0Smrg							kgem->batch[kgem->reloc[n].offset/sizeof(kgem->batch[0])] = addr;
362563ef14f0Smrg							if (kgem->gen >= 0100)
362663ef14f0Smrg								kgem->batch[kgem->reloc[n].offset/sizeof(kgem->batch[0]) + 1] = addr >> 32;
362763ef14f0Smrg
362803b705cfSriastradh							kgem->reloc[n].target_handle = shrink->target_handle;
362903b705cfSriastradh							kgem->reloc[n].presumed_offset = shrink->presumed_offset;
363003b705cfSriastradh						}
363103b705cfSriastradh					}
363203b705cfSriastradh
363303b705cfSriastradh					bo->base.exec->handle = shrink->handle;
363403b705cfSriastradh					bo->base.exec->offset = shrink->presumed_offset;
363503b705cfSriastradh					shrink->exec = bo->base.exec;
363603b705cfSriastradh					shrink->rq = bo->base.rq;
363703b705cfSriastradh					list_replace(&bo->base.request,
363803b705cfSriastradh						     &shrink->request);
363903b705cfSriastradh					list_init(&bo->base.request);
364003b705cfSriastradh					shrink->needs_flush = bo->base.gpu_dirty;
364103b705cfSriastradh
364203b705cfSriastradh					bo->base.exec = NULL;
364303b705cfSriastradh					bo->base.rq = NULL;
364403b705cfSriastradh					bo->base.gpu_dirty = false;
364503b705cfSriastradh					bo->base.needs_flush = false;
364603b705cfSriastradh					bo->used = 0;
364703b705cfSriastradh
364803b705cfSriastradh					goto decouple;
364903b705cfSriastradh				}
365003b705cfSriastradh
365103b705cfSriastradh				__kgem_bo_destroy(kgem, shrink);
365203b705cfSriastradh			}
365303b705cfSriastradh
365403b705cfSriastradh			shrink = search_linear_cache(kgem, alloc,
365503b705cfSriastradh						     CREATE_INACTIVE | CREATE_NO_RETIRE);
365603b705cfSriastradh			if (shrink) {
365703b705cfSriastradh				int n;
365803b705cfSriastradh
365903b705cfSriastradh				DBG(("%s: used=%d, shrinking %d to %d, handle %d to %d\n",
366003b705cfSriastradh				     __FUNCTION__,
366103b705cfSriastradh				     bo->used, bytes(&bo->base), bytes(shrink),
366203b705cfSriastradh				     bo->base.handle, shrink->handle));
366303b705cfSriastradh
366403b705cfSriastradh				assert(bo->used <= bytes(shrink));
36659a906b70Schristos				if (gem_write__cachealigned(kgem->fd, shrink->handle,
36669a906b70Schristos							    0, bo->used, bo->mem) == 0) {
366703b705cfSriastradh					shrink->target_handle =
366803b705cfSriastradh						kgem->has_handle_lut ? bo->base.target_handle : shrink->handle;
366903b705cfSriastradh					for (n = 0; n < kgem->nreloc; n++) {
367003b705cfSriastradh						if (kgem->reloc[n].target_handle == bo->base.target_handle) {
367163ef14f0Smrg							uint64_t addr = (int)kgem->reloc[n].delta + shrink->presumed_offset;
367263ef14f0Smrg							kgem->batch[kgem->reloc[n].offset/sizeof(kgem->batch[0])] = addr;
367363ef14f0Smrg							if (kgem->gen >= 0100)
367463ef14f0Smrg								kgem->batch[kgem->reloc[n].offset/sizeof(kgem->batch[0]) + 1] = addr >> 32;
367563ef14f0Smrg
367603b705cfSriastradh							kgem->reloc[n].target_handle = shrink->target_handle;
367703b705cfSriastradh							kgem->reloc[n].presumed_offset = shrink->presumed_offset;
367803b705cfSriastradh						}
367903b705cfSriastradh					}
368003b705cfSriastradh
368103b705cfSriastradh					bo->base.exec->handle = shrink->handle;
368203b705cfSriastradh					bo->base.exec->offset = shrink->presumed_offset;
368303b705cfSriastradh					shrink->exec = bo->base.exec;
368403b705cfSriastradh					shrink->rq = bo->base.rq;
368503b705cfSriastradh					list_replace(&bo->base.request,
368603b705cfSriastradh						     &shrink->request);
368703b705cfSriastradh					list_init(&bo->base.request);
368803b705cfSriastradh					shrink->needs_flush = bo->base.gpu_dirty;
368903b705cfSriastradh
369003b705cfSriastradh					bo->base.exec = NULL;
369103b705cfSriastradh					bo->base.rq = NULL;
369203b705cfSriastradh					bo->base.gpu_dirty = false;
369303b705cfSriastradh					bo->base.needs_flush = false;
369403b705cfSriastradh					bo->used = 0;
369503b705cfSriastradh
369603b705cfSriastradh					goto decouple;
369703b705cfSriastradh				}
369803b705cfSriastradh
369903b705cfSriastradh				__kgem_bo_destroy(kgem, shrink);
370003b705cfSriastradh			}
370103b705cfSriastradh		}
370203b705cfSriastradh
370303b705cfSriastradh		DBG(("%s: handle=%d, uploading %d/%d\n",
370403b705cfSriastradh		     __FUNCTION__, bo->base.handle, bo->used, bytes(&bo->base)));
370503b705cfSriastradh		ASSERT_IDLE(kgem, bo->base.handle);
370603b705cfSriastradh		assert(bo->used <= bytes(&bo->base));
37079a906b70Schristos		gem_write__cachealigned(kgem->fd, bo->base.handle,
37089a906b70Schristos					0, bo->used, bo->mem);
370903b705cfSriastradh		bo->need_io = 0;
371003b705cfSriastradh
371103b705cfSriastradhdecouple:
371203b705cfSriastradh		DBG(("%s: releasing handle=%d\n",
371303b705cfSriastradh		     __FUNCTION__, bo->base.handle));
371403b705cfSriastradh		list_del(&bo->base.list);
371503b705cfSriastradh		kgem_bo_unref(kgem, &bo->base);
371603b705cfSriastradh	}
371703b705cfSriastradh}
371803b705cfSriastradh
371903b705cfSriastradhstatic void kgem_cleanup(struct kgem *kgem)
372003b705cfSriastradh{
372103b705cfSriastradh	int n;
372203b705cfSriastradh
372303b705cfSriastradh	for (n = 0; n < ARRAY_SIZE(kgem->requests); n++) {
372403b705cfSriastradh		while (!list_is_empty(&kgem->requests[n])) {
372503b705cfSriastradh			struct kgem_request *rq;
372603b705cfSriastradh
372703b705cfSriastradh			rq = list_first_entry(&kgem->requests[n],
372803b705cfSriastradh					      struct kgem_request,
372903b705cfSriastradh					      list);
37309a906b70Schristos			assert(rq->ring == n);
373103b705cfSriastradh			while (!list_is_empty(&rq->buffers)) {
373203b705cfSriastradh				struct kgem_bo *bo;
373303b705cfSriastradh
373403b705cfSriastradh				bo = list_first_entry(&rq->buffers,
373503b705cfSriastradh						      struct kgem_bo,
373603b705cfSriastradh						      request);
373703b705cfSriastradh
373803b705cfSriastradh				bo->exec = NULL;
373903b705cfSriastradh				bo->gpu_dirty = false;
374003b705cfSriastradh				__kgem_bo_clear_busy(bo);
374103b705cfSriastradh				if (bo->refcnt == 0)
374203b705cfSriastradh					kgem_bo_free(kgem, bo);
374303b705cfSriastradh			}
374403b705cfSriastradh
374563ef14f0Smrg			if (--rq->bo->refcnt == 0)
374663ef14f0Smrg				kgem_bo_free(kgem, rq->bo);
374763ef14f0Smrg
374803b705cfSriastradh			__kgem_request_free(rq);
374903b705cfSriastradh		}
375003b705cfSriastradh	}
375103b705cfSriastradh
375203b705cfSriastradh	kgem_close_inactive(kgem);
375303b705cfSriastradh}
375403b705cfSriastradh
3755813957e3Ssnjstatic int
3756813957e3Ssnjkgem_batch_write(struct kgem *kgem,
3757813957e3Ssnj		 struct kgem_bo *bo,
3758813957e3Ssnj		 uint32_t size)
375903b705cfSriastradh{
3760813957e3Ssnj	char *ptr;
376103b705cfSriastradh	int ret;
376203b705cfSriastradh
376363ef14f0Smrg	assert(bo->exec == NULL);
376463ef14f0Smrg	assert(bo->rq == NULL);
376563ef14f0Smrg	assert(!__kgem_busy(kgem, bo->handle));
376603b705cfSriastradh
37679a906b70Schristos#if DBG_NO_EXEC
37689a906b70Schristos	{
37699a906b70Schristos		uint32_t batch[] = { MI_BATCH_BUFFER_END, 0};
3770813957e3Ssnj		return gem_write(kgem->fd, bo->handle, 0, sizeof(batch), batch);
37719a906b70Schristos	}
37729a906b70Schristos#endif
37739a906b70Schristos
3774813957e3Ssnj	assert(!bo->scanout);
37759a906b70Schristosretry:
3776813957e3Ssnj	ptr = NULL;
3777813957e3Ssnj	if (bo->domain == DOMAIN_CPU || kgem->has_llc) {
3778813957e3Ssnj		ptr = bo->map__cpu;
3779813957e3Ssnj		if (ptr == NULL)
3780813957e3Ssnj			ptr = __kgem_bo_map__cpu(kgem, bo);
3781813957e3Ssnj	} else if (kgem->has_wc_mmap) {
3782813957e3Ssnj		ptr = bo->map__wc;
3783813957e3Ssnj		if (ptr == NULL)
3784813957e3Ssnj			ptr = __kgem_bo_map__wc(kgem, bo);
3785813957e3Ssnj	}
3786813957e3Ssnj	if (ptr) {
3787813957e3Ssnj		memcpy(ptr, kgem->batch, sizeof(uint32_t)*kgem->nbatch);
3788813957e3Ssnj		if (kgem->surface != kgem->batch_size) {
3789813957e3Ssnj			ret = PAGE_ALIGN(sizeof(uint32_t) * kgem->batch_size);
3790813957e3Ssnj			ret -= sizeof(uint32_t) * kgem->surface;
3791813957e3Ssnj			ptr += size - ret;
3792813957e3Ssnj			memcpy(ptr, kgem->batch + kgem->surface,
3793813957e3Ssnj			       (kgem->batch_size - kgem->surface)*sizeof(uint32_t));
3794813957e3Ssnj		}
3795813957e3Ssnj		return 0;
3796813957e3Ssnj	}
3797813957e3Ssnj
379803b705cfSriastradh	/* If there is no surface data, just upload the batch */
37999a906b70Schristos	if (kgem->surface == kgem->batch_size) {
3800813957e3Ssnj		if ((ret = gem_write__cachealigned(kgem->fd, bo->handle,
38019a906b70Schristos						   0, sizeof(uint32_t)*kgem->nbatch,
38029a906b70Schristos						   kgem->batch)) == 0)
38039a906b70Schristos			return 0;
38049a906b70Schristos
38059a906b70Schristos		goto expire;
38069a906b70Schristos	}
380703b705cfSriastradh
380803b705cfSriastradh	/* Are the batch pages conjoint with the surface pages? */
380903b705cfSriastradh	if (kgem->surface < kgem->nbatch + PAGE_SIZE/sizeof(uint32_t)) {
381003b705cfSriastradh		assert(size == PAGE_ALIGN(kgem->batch_size*sizeof(uint32_t)));
3811813957e3Ssnj		if ((ret = gem_write__cachealigned(kgem->fd, bo->handle,
38129a906b70Schristos						   0, kgem->batch_size*sizeof(uint32_t),
38139a906b70Schristos						   kgem->batch)) == 0)
38149a906b70Schristos			return 0;
38159a906b70Schristos
38169a906b70Schristos		goto expire;
381703b705cfSriastradh	}
381803b705cfSriastradh
381903b705cfSriastradh	/* Disjoint surface/batch, upload separately */
3820813957e3Ssnj	if ((ret = gem_write__cachealigned(kgem->fd, bo->handle,
38219a906b70Schristos					   0, sizeof(uint32_t)*kgem->nbatch,
38229a906b70Schristos					   kgem->batch)))
38239a906b70Schristos		goto expire;
382403b705cfSriastradh
382503b705cfSriastradh	ret = PAGE_ALIGN(sizeof(uint32_t) * kgem->batch_size);
382603b705cfSriastradh	ret -= sizeof(uint32_t) * kgem->surface;
382703b705cfSriastradh	assert(size-ret >= kgem->nbatch*sizeof(uint32_t));
3828813957e3Ssnj	if (gem_write(kgem->fd, bo->handle,
38299a906b70Schristos		      size - ret, (kgem->batch_size - kgem->surface)*sizeof(uint32_t),
38309a906b70Schristos		      kgem->batch + kgem->surface))
38319a906b70Schristos		goto expire;
38329a906b70Schristos
38339a906b70Schristos	return 0;
38349a906b70Schristos
38359a906b70Schristosexpire:
38369a906b70Schristos	assert(ret != EINVAL);
38379a906b70Schristos
38389a906b70Schristos	(void)__kgem_throttle_retire(kgem, 0);
38399a906b70Schristos	if (kgem_expire_cache(kgem))
38409a906b70Schristos		goto retry;
38419a906b70Schristos
38429a906b70Schristos	if (kgem_cleanup_cache(kgem))
38439a906b70Schristos		goto retry;
38449a906b70Schristos
38459a906b70Schristos	ERR(("%s: failed to write batch (handle=%d): %d\n",
3846813957e3Ssnj	     __FUNCTION__, bo->handle, -ret));
38479a906b70Schristos	return ret;
384803b705cfSriastradh}
384903b705cfSriastradh
385003b705cfSriastradhvoid kgem_reset(struct kgem *kgem)
385103b705cfSriastradh{
385203b705cfSriastradh	if (kgem->next_request) {
385303b705cfSriastradh		struct kgem_request *rq = kgem->next_request;
385403b705cfSriastradh
385503b705cfSriastradh		while (!list_is_empty(&rq->buffers)) {
385603b705cfSriastradh			struct kgem_bo *bo =
385703b705cfSriastradh				list_first_entry(&rq->buffers,
385803b705cfSriastradh						 struct kgem_bo,
385903b705cfSriastradh						 request);
386003b705cfSriastradh			list_del(&bo->request);
386103b705cfSriastradh
386203b705cfSriastradh			assert(RQ(bo->rq) == rq);
386303b705cfSriastradh
386403b705cfSriastradh			bo->binding.offset = 0;
386503b705cfSriastradh			bo->exec = NULL;
386603b705cfSriastradh			bo->target_handle = -1;
386703b705cfSriastradh			bo->gpu_dirty = false;
386803b705cfSriastradh
386903b705cfSriastradh			if (bo->needs_flush && __kgem_busy(kgem, bo->handle)) {
387003b705cfSriastradh				assert(bo->domain == DOMAIN_GPU || bo->domain == DOMAIN_NONE);
387103b705cfSriastradh				list_add(&bo->request, &kgem->flushing);
387203b705cfSriastradh				bo->rq = (void *)kgem;
38739a906b70Schristos				kgem->need_retire = true;
387403b705cfSriastradh			} else
387503b705cfSriastradh				__kgem_bo_clear_busy(bo);
387603b705cfSriastradh
387703b705cfSriastradh			if (bo->refcnt || bo->rq)
387803b705cfSriastradh				continue;
387903b705cfSriastradh
38809a906b70Schristos			kgem_bo_move_to_cache(kgem, bo);
388103b705cfSriastradh		}
388203b705cfSriastradh
388303b705cfSriastradh		if (rq != &kgem->static_request) {
388403b705cfSriastradh			list_init(&rq->list);
388503b705cfSriastradh			__kgem_request_free(rq);
388603b705cfSriastradh		}
388703b705cfSriastradh	}
388803b705cfSriastradh
388903b705cfSriastradh	kgem->nfence = 0;
389003b705cfSriastradh	kgem->nexec = 0;
389103b705cfSriastradh	kgem->nreloc = 0;
389203b705cfSriastradh	kgem->nreloc__self = 0;
389303b705cfSriastradh	kgem->aperture = 0;
389403b705cfSriastradh	kgem->aperture_fenced = 0;
38959a906b70Schristos	kgem->aperture_max_fence = 0;
389603b705cfSriastradh	kgem->nbatch = 0;
389703b705cfSriastradh	kgem->surface = kgem->batch_size;
389803b705cfSriastradh	kgem->mode = KGEM_NONE;
38999a906b70Schristos	kgem->needs_semaphore = false;
39009a906b70Schristos	kgem->needs_reservation = false;
390103b705cfSriastradh	kgem->flush = 0;
390203b705cfSriastradh	kgem->batch_flags = kgem->batch_flags_base;
3903813957e3Ssnj	assert(kgem->batch);
390403b705cfSriastradh
390503b705cfSriastradh	kgem->next_request = __kgem_request_alloc(kgem);
390603b705cfSriastradh
390703b705cfSriastradh	kgem_sna_reset(kgem);
390803b705cfSriastradh}
390903b705cfSriastradh
3910813957e3Ssnjstatic int compact_batch_surface(struct kgem *kgem, int *shrink)
391103b705cfSriastradh{
3912813957e3Ssnj	int size, n;
391303b705cfSriastradh
391403b705cfSriastradh	if (!kgem->has_relaxed_delta)
39159a906b70Schristos		return kgem->batch_size * sizeof(uint32_t);
391603b705cfSriastradh
391703b705cfSriastradh	/* See if we can pack the contents into one or two pages */
391803b705cfSriastradh	n = ALIGN(kgem->batch_size, 1024);
391903b705cfSriastradh	size = n - kgem->surface + kgem->nbatch;
392003b705cfSriastradh	size = ALIGN(size, 1024);
392103b705cfSriastradh
3922813957e3Ssnj	*shrink = (n - size) * sizeof(uint32_t);
392303b705cfSriastradh	return size * sizeof(uint32_t);
392403b705cfSriastradh}
392503b705cfSriastradh
392663ef14f0Smrgstatic struct kgem_bo *first_available(struct kgem *kgem, struct list *list)
392763ef14f0Smrg{
392863ef14f0Smrg	struct kgem_bo *bo;
392963ef14f0Smrg
393063ef14f0Smrg	list_for_each_entry(bo, list, list) {
393163ef14f0Smrg		assert(bo->refcnt > 0);
393263ef14f0Smrg
393363ef14f0Smrg		if (bo->rq) {
393463ef14f0Smrg			assert(RQ(bo->rq)->bo == bo);
393563ef14f0Smrg			if (__kgem_busy(kgem, bo->handle))
393663ef14f0Smrg				break;
393763ef14f0Smrg
393863ef14f0Smrg			__kgem_retire_rq(kgem, RQ(bo->rq));
393963ef14f0Smrg			assert(bo->rq == NULL);
394063ef14f0Smrg		}
394163ef14f0Smrg
394263ef14f0Smrg		if (bo->refcnt > 1)
394363ef14f0Smrg			continue;
394463ef14f0Smrg
394563ef14f0Smrg		list_move_tail(&bo->list, list);
394663ef14f0Smrg		return kgem_bo_reference(bo);
394763ef14f0Smrg	}
394863ef14f0Smrg
394963ef14f0Smrg	return NULL;
395063ef14f0Smrg}
395163ef14f0Smrg
395203b705cfSriastradhstatic struct kgem_bo *
3953813957e3Ssnjkgem_create_batch(struct kgem *kgem)
395403b705cfSriastradh{
395503b705cfSriastradh	struct kgem_bo *bo;
395663ef14f0Smrg	int size, shrink = 0;
3957813957e3Ssnj
395863ef14f0Smrg#if !DBG_NO_SHRINK_BATCHES
3959813957e3Ssnj	if (kgem->surface != kgem->batch_size)
3960813957e3Ssnj		size = compact_batch_surface(kgem, &shrink);
3961813957e3Ssnj	else
3962813957e3Ssnj		size = kgem->nbatch * sizeof(uint32_t);
396303b705cfSriastradh
396403b705cfSriastradh	if (size <= 4096) {
396563ef14f0Smrg		bo = first_available(kgem, &kgem->pinned_batches[0]);
396663ef14f0Smrg		if (bo)
3967813957e3Ssnj			goto write;
396863ef14f0Smrg	}
396903b705cfSriastradh
397063ef14f0Smrg	if (size <= 16384) {
397163ef14f0Smrg		bo = first_available(kgem, &kgem->pinned_batches[1]);
397263ef14f0Smrg		if (bo)
397363ef14f0Smrg			goto write;
397403b705cfSriastradh	}
397503b705cfSriastradh
39769a906b70Schristos	if (kgem->gen == 020) {
39779a906b70Schristos		bo = kgem_create_linear(kgem, size, CREATE_CACHED | CREATE_TEMPORARY);
39789a906b70Schristos		if (bo)
3979813957e3Ssnj			goto write;
398003b705cfSriastradh
39819a906b70Schristos		/* Nothing available for reuse, rely on the kernel wa */
39829a906b70Schristos		if (kgem->has_pinned_batches) {
39839a906b70Schristos			bo = kgem_create_linear(kgem, size, CREATE_CACHED | CREATE_TEMPORARY);
39849a906b70Schristos			if (bo) {
39859a906b70Schristos				kgem->batch_flags &= ~LOCAL_I915_EXEC_IS_PINNED;
3986813957e3Ssnj				goto write;
39879a906b70Schristos			}
39889a906b70Schristos		}
39899a906b70Schristos
39909a906b70Schristos		if (size < 16384) {
39919a906b70Schristos			bo = list_first_entry(&kgem->pinned_batches[size > 4096],
39929a906b70Schristos					      struct kgem_bo,
39939a906b70Schristos					      list);
39949a906b70Schristos			list_move_tail(&bo->list, &kgem->pinned_batches[size > 4096]);
399503b705cfSriastradh
39969a906b70Schristos			DBG(("%s: syncing due to busy batches\n", __FUNCTION__));
399763ef14f0Smrg			if (kgem_bo_wait(kgem, bo))
39989a906b70Schristos				return NULL;
399903b705cfSriastradh
40009a906b70Schristos			kgem_retire(kgem);
40019a906b70Schristos			assert(bo->rq == NULL);
4002813957e3Ssnj			bo = kgem_bo_reference(bo);
4003813957e3Ssnj			goto write;
40049a906b70Schristos		}
400503b705cfSriastradh	}
400663ef14f0Smrg#else
400763ef14f0Smrg	if (kgem->surface != kgem->batch_size)
400863ef14f0Smrg		size = kgem->batch_size * sizeof(uint32_t);
400963ef14f0Smrg	else
401063ef14f0Smrg		size = kgem->nbatch * sizeof(uint32_t);
401163ef14f0Smrg#endif
401203b705cfSriastradh
401363ef14f0Smrg	if (!kgem->batch_bo || !kgem->has_llc) {
4014813957e3Ssnj		bo = kgem_create_linear(kgem, size, CREATE_NO_THROTTLE);
4015813957e3Ssnj		if (bo) {
4016813957e3Ssnjwrite:
4017813957e3Ssnj			kgem_fixup_relocs(kgem, bo, shrink);
4018813957e3Ssnj			if (kgem_batch_write(kgem, bo, size)) {
4019813957e3Ssnj				kgem_bo_destroy(kgem, bo);
4020813957e3Ssnj				return NULL;
4021813957e3Ssnj			}
402263ef14f0Smrg			return bo;
4023813957e3Ssnj		}
4024813957e3Ssnj	}
402563ef14f0Smrg
4026813957e3Ssnj	return kgem_new_batch(kgem);
402703b705cfSriastradh}
402803b705cfSriastradh
40299a906b70Schristos#if !NDEBUG
/*
 * Echo the contents of the file at @path, line by line, through ErrorF().
 *
 * Returns false if the file could not be opened, true otherwise.
 */
static bool dump_file(const char *path)
{
	char *line = NULL;
	size_t capacity = 0;
	FILE *fp;

	fp = fopen(path, "r");
	if (!fp)
		return false;

	for (;;) {
		if (getline(&line, &capacity, fp) == -1)
			break;

		ErrorF("%s", line);
	}

	/* getline() allocated the line buffer; release it with free() */
	free(line);
	fclose(fp);
	return true;
}
40479a906b70Schristos
/*
 * Dump the debugfs file @name belonging to this device through dump_file().
 *
 * The file is looked up as <root>/<minor>/<name>, trying
 * /sys/kernel/debug/dri first and /debug/dri second, and stopping at the
 * first one that can be opened. Nothing is dumped if the minor number is
 * not available. A path that does not fit the local buffer is skipped
 * rather than truncated.
 */
static void dump_debugfs(struct kgem *kgem, const char *name)
{
	static const char * const roots[] = {
		"/sys/kernel/debug/dri",
		"/debug/dri",
	};
	char path[80];
	int minor = kgem_get_minor(kgem);
	unsigned i;

	if (minor < 0)
		return;

	for (i = 0; i < sizeof(roots)/sizeof(roots[0]); i++) {
		int len = snprintf(path, sizeof(path), "%s/%d/%s",
				   roots[i], minor, name);

		/* Never open a truncated (and therefore wrong) path */
		if (len < 0 || (size_t)len >= sizeof(path))
			continue;

		if (dump_file(path))
			return;
	}
}
40649a906b70Schristos
/* Dump the "i915_gem_gtt" debugfs file for this device. */
static void dump_gtt_info(struct kgem *kgem)
{
	dump_debugfs(kgem, "i915_gem_gtt");
}
40699a906b70Schristos
/* Dump the "i915_gem_fence_regs" debugfs file for this device. */
static void dump_fence_regs(struct kgem *kgem)
{
	dump_debugfs(kgem, "i915_gem_fence_regs");
}
40749a906b70Schristos#endif
40759a906b70Schristos
40769a906b70Schristosstatic int do_execbuf(struct kgem *kgem, struct drm_i915_gem_execbuffer2 *execbuf)
40779a906b70Schristos{
407863ef14f0Smrg	int ret;
40799a906b70Schristos
40809a906b70Schristosretry:
40819a906b70Schristos	ret = do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_EXECBUFFER2, execbuf);
40829a906b70Schristos	if (ret == 0)
40839a906b70Schristos		return 0;
40849a906b70Schristos
40859a906b70Schristos	DBG(("%s: failed ret=%d, throttling and discarding cache\n", __FUNCTION__, ret));
40869a906b70Schristos	(void)__kgem_throttle_retire(kgem, 0);
40879a906b70Schristos	if (kgem_expire_cache(kgem))
40889a906b70Schristos		goto retry;
40899a906b70Schristos
40909a906b70Schristos	if (kgem_cleanup_cache(kgem))
40919a906b70Schristos		goto retry;
40929a906b70Schristos
40939a906b70Schristos	/* last gasp */
4094813957e3Ssnj	ret = do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_EXECBUFFER2, execbuf);
409563ef14f0Smrg	if (ret != -ENOSPC)
409663ef14f0Smrg		return ret;
409763ef14f0Smrg
409863ef14f0Smrg	/* One final trick up our sleeve for when we run out of space.
409963ef14f0Smrg	 * We turn everything off to free up our pinned framebuffers,
410063ef14f0Smrg	 * sprites and cursors, and try just one more time.
410163ef14f0Smrg	 */
4102813957e3Ssnj
4103813957e3Ssnj	xf86DrvMsg(kgem_get_screen_index(kgem), X_WARNING,
4104813957e3Ssnj		   "Failed to submit rendering commands, trying again with outputs disabled.\n");
4105813957e3Ssnj
410663ef14f0Smrg	if (sna_mode_disable(__to_sna(kgem))) {
4107813957e3Ssnj		kgem_cleanup_cache(kgem);
4108813957e3Ssnj		ret = do_ioctl(kgem->fd,
4109813957e3Ssnj			       DRM_IOCTL_I915_GEM_EXECBUFFER2,
4110813957e3Ssnj			       execbuf);
4111813957e3Ssnj		DBG(("%s: last_gasp ret=%d\n", __FUNCTION__, ret));
411263ef14f0Smrg		sna_mode_enable(__to_sna(kgem));
4113813957e3Ssnj	}
4114813957e3Ssnj
4115813957e3Ssnj	return ret;
41169a906b70Schristos}
41179a906b70Schristos
411803b705cfSriastradhvoid _kgem_submit(struct kgem *kgem)
411903b705cfSriastradh{
412003b705cfSriastradh	struct kgem_request *rq;
412103b705cfSriastradh	uint32_t batch_end;
412263ef14f0Smrg	int i, ret;
412303b705cfSriastradh
412403b705cfSriastradh	assert(!DBG_NO_HW);
412503b705cfSriastradh	assert(!kgem->wedged);
412603b705cfSriastradh
412703b705cfSriastradh	assert(kgem->nbatch);
412803b705cfSriastradh	assert(kgem->nbatch <= KGEM_BATCH_SIZE(kgem));
412903b705cfSriastradh	assert(kgem->nbatch <= kgem->surface);
413003b705cfSriastradh
413103b705cfSriastradh	batch_end = kgem_end_batch(kgem);
413203b705cfSriastradh	kgem_sna_flush(kgem);
413303b705cfSriastradh
41349a906b70Schristos	DBG(("batch[%d/%d, flags=%x]: %d %d %d %d, nreloc=%d, nexec=%d, nfence=%d, aperture=%d [fenced=%d]\n",
41359a906b70Schristos	     kgem->mode, kgem->ring, kgem->batch_flags,
41369a906b70Schristos	     batch_end, kgem->nbatch, kgem->surface, kgem->batch_size,
41379a906b70Schristos	     kgem->nreloc, kgem->nexec, kgem->nfence, kgem->aperture, kgem->aperture_fenced));
413803b705cfSriastradh
413903b705cfSriastradh	assert(kgem->nbatch <= kgem->batch_size);
414003b705cfSriastradh	assert(kgem->nbatch <= kgem->surface);
414103b705cfSriastradh	assert(kgem->nreloc <= ARRAY_SIZE(kgem->reloc));
414203b705cfSriastradh	assert(kgem->nexec < ARRAY_SIZE(kgem->exec));
414303b705cfSriastradh	assert(kgem->nfence <= kgem->fence_max);
414403b705cfSriastradh
414503b705cfSriastradh	kgem_finish_buffers(kgem);
414603b705cfSriastradh
41479a906b70Schristos#if SHOW_BATCH_BEFORE
414803b705cfSriastradh	__kgem_batch_debug(kgem, batch_end);
414903b705cfSriastradh#endif
415003b705cfSriastradh
415103b705cfSriastradh	rq = kgem->next_request;
4152813957e3Ssnj	assert(rq->bo == NULL);
4153813957e3Ssnj
4154813957e3Ssnj	rq->bo = kgem_create_batch(kgem);
415503b705cfSriastradh	if (rq->bo) {
4156813957e3Ssnj		struct drm_i915_gem_execbuffer2 execbuf;
415703b705cfSriastradh
415803b705cfSriastradh		assert(!rq->bo->needs_flush);
415903b705cfSriastradh
416003b705cfSriastradh		i = kgem->nexec++;
4161813957e3Ssnj		kgem->exec[i].handle = rq->bo->handle;
416203b705cfSriastradh		kgem->exec[i].relocation_count = kgem->nreloc;
416303b705cfSriastradh		kgem->exec[i].relocs_ptr = (uintptr_t)kgem->reloc;
416403b705cfSriastradh		kgem->exec[i].alignment = 0;
416503b705cfSriastradh		kgem->exec[i].offset = rq->bo->presumed_offset;
416663ef14f0Smrg		/* Make sure the kernel releases any fence, ignored if gen4+ */
416763ef14f0Smrg		kgem->exec[i].flags = EXEC_OBJECT_NEEDS_FENCE;
416803b705cfSriastradh		kgem->exec[i].rsvd1 = 0;
416903b705cfSriastradh		kgem->exec[i].rsvd2 = 0;
417003b705cfSriastradh
417103b705cfSriastradh		rq->bo->exec = &kgem->exec[i];
417203b705cfSriastradh		rq->bo->rq = MAKE_REQUEST(rq, kgem->ring); /* useful sanity check */
417303b705cfSriastradh		list_add(&rq->bo->request, &rq->buffers);
417403b705cfSriastradh		rq->ring = kgem->ring == KGEM_BLT;
417503b705cfSriastradh
4176813957e3Ssnj		memset(&execbuf, 0, sizeof(execbuf));
4177813957e3Ssnj		execbuf.buffers_ptr = (uintptr_t)kgem->exec;
4178813957e3Ssnj		execbuf.buffer_count = kgem->nexec;
417963ef14f0Smrg		if (kgem->gen < 030)
418063ef14f0Smrg			execbuf.batch_len = batch_end*sizeof(uint32_t);
4181813957e3Ssnj		execbuf.flags = kgem->ring | kgem->batch_flags;
4182813957e3Ssnj
4183813957e3Ssnj		if (DBG_DUMP) {
4184813957e3Ssnj			int fd = open("/tmp/i915-batchbuffers.dump",
4185813957e3Ssnj				      O_WRONLY | O_CREAT | O_APPEND,
4186813957e3Ssnj				      0666);
4187813957e3Ssnj			if (fd != -1) {
4188813957e3Ssnj				ret = write(fd, kgem->batch, batch_end*sizeof(uint32_t));
4189813957e3Ssnj				fd = close(fd);
419003b705cfSriastradh			}
4191813957e3Ssnj		}
419203b705cfSriastradh
4193813957e3Ssnj		ret = do_execbuf(kgem, &execbuf);
419463ef14f0Smrg	} else
419563ef14f0Smrg		ret = -ENOMEM;
419603b705cfSriastradh
419763ef14f0Smrg	if (ret < 0) {
419863ef14f0Smrg		kgem_throttle(kgem);
419963ef14f0Smrg		if (!kgem->wedged) {
420063ef14f0Smrg			xf86DrvMsg(kgem_get_screen_index(kgem), X_ERROR,
420163ef14f0Smrg				   "Failed to submit rendering commands (%s), disabling acceleration.\n",
420263ef14f0Smrg				   strerror(-ret));
420363ef14f0Smrg			__kgem_set_wedged(kgem);
4204813957e3Ssnj		}
420503b705cfSriastradh
420603b705cfSriastradh#if !NDEBUG
420763ef14f0Smrg		ErrorF("batch[%d/%d]: %d %d %d, nreloc=%d, nexec=%d, nfence=%d, aperture=%d, fenced=%d, high=%d,%d: errno=%d\n",
420863ef14f0Smrg		       kgem->mode, kgem->ring, batch_end, kgem->nbatch, kgem->surface,
420963ef14f0Smrg		       kgem->nreloc, kgem->nexec, kgem->nfence, kgem->aperture, kgem->aperture_fenced, kgem->aperture_high, kgem->aperture_total, -ret);
421003b705cfSriastradh
421163ef14f0Smrg		for (i = 0; i < kgem->nexec; i++) {
421263ef14f0Smrg			struct kgem_bo *bo, *found = NULL;
421303b705cfSriastradh
421463ef14f0Smrg			list_for_each_entry(bo, &kgem->next_request->buffers, request) {
421563ef14f0Smrg				if (bo->handle == kgem->exec[i].handle) {
421663ef14f0Smrg					found = bo;
421763ef14f0Smrg					break;
421803b705cfSriastradh				}
4219813957e3Ssnj			}
422063ef14f0Smrg			ErrorF("exec[%d] = handle:%d, presumed offset: %x, size: %d, tiling %d, fenced %d, snooped %d, deleted %d\n",
422163ef14f0Smrg			       i,
422263ef14f0Smrg			       kgem->exec[i].handle,
422363ef14f0Smrg			       (int)kgem->exec[i].offset,
422463ef14f0Smrg			       found ? kgem_bo_size(found) : -1,
422563ef14f0Smrg			       found ? found->tiling : -1,
422663ef14f0Smrg			       (int)(kgem->exec[i].flags & EXEC_OBJECT_NEEDS_FENCE),
422763ef14f0Smrg			       found ? found->snoop : -1,
422863ef14f0Smrg			       found ? found->purged : -1);
422963ef14f0Smrg		}
423063ef14f0Smrg		for (i = 0; i < kgem->nreloc; i++) {
423163ef14f0Smrg			ErrorF("reloc[%d] = pos:%d, target:%d, delta:%d, read:%x, write:%x, offset:%x\n",
423263ef14f0Smrg			       i,
423363ef14f0Smrg			       (int)kgem->reloc[i].offset,
423463ef14f0Smrg			       kgem->reloc[i].target_handle,
423563ef14f0Smrg			       kgem->reloc[i].delta,
423663ef14f0Smrg			       kgem->reloc[i].read_domains,
423763ef14f0Smrg			       kgem->reloc[i].write_domain,
423863ef14f0Smrg			       (int)kgem->reloc[i].presumed_offset);
423963ef14f0Smrg		}
424063ef14f0Smrg
424163ef14f0Smrg		{
424263ef14f0Smrg			struct drm_i915_gem_get_aperture aperture;
424363ef14f0Smrg			if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_GET_APERTURE, &aperture) == 0)
424463ef14f0Smrg				ErrorF("Aperture size %lld, available %lld\n",
424563ef14f0Smrg				       (long long)aperture.aper_size,
424663ef14f0Smrg				       (long long)aperture.aper_available_size);
424763ef14f0Smrg		}
424863ef14f0Smrg
424963ef14f0Smrg		if (ret == -ENOSPC)
425063ef14f0Smrg			dump_gtt_info(kgem);
425163ef14f0Smrg		if (ret == -EDEADLK)
425263ef14f0Smrg			dump_fence_regs(kgem);
425363ef14f0Smrg
425463ef14f0Smrg		if (DEBUG_SYNC) {
425563ef14f0Smrg			int fd = open("/tmp/batchbuffer", O_WRONLY | O_CREAT | O_APPEND, 0666);
425663ef14f0Smrg			if (fd != -1) {
425763ef14f0Smrg				int ignored = write(fd, kgem->batch, batch_end*sizeof(uint32_t));
425863ef14f0Smrg				assert(ignored == batch_end*sizeof(uint32_t));
425963ef14f0Smrg				close(fd);
4260813957e3Ssnj			}
426103b705cfSriastradh
426263ef14f0Smrg			FatalError("SNA: failed to submit batchbuffer, errno=%d\n", -ret);
426363ef14f0Smrg		}
426463ef14f0Smrg#endif
426563ef14f0Smrg	} else {
426663ef14f0Smrg		if (DEBUG_SYNC) {
426763ef14f0Smrg			struct drm_i915_gem_set_domain set_domain;
42689a906b70Schristos
426963ef14f0Smrg			VG_CLEAR(set_domain);
427063ef14f0Smrg			set_domain.handle = rq->bo->handle;
427163ef14f0Smrg			set_domain.read_domains = I915_GEM_DOMAIN_GTT;
427263ef14f0Smrg			set_domain.write_domain = I915_GEM_DOMAIN_GTT;
4273813957e3Ssnj
427463ef14f0Smrg			ret = do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_DOMAIN, &set_domain);
427503b705cfSriastradh		}
427663ef14f0Smrg
42779a906b70Schristos#if SHOW_BATCH_AFTER
427863ef14f0Smrg		if (gem_read(kgem->fd, rq->bo->handle, kgem->batch, 0, batch_end*sizeof(uint32_t)) == 0)
427963ef14f0Smrg			__kgem_batch_debug(kgem, batch_end);
42809a906b70Schristos#endif
428163ef14f0Smrg
428263ef14f0Smrg		kgem_commit(kgem);
428363ef14f0Smrg	}
428463ef14f0Smrg
428563ef14f0Smrg	if (unlikely(kgem->wedged))
428603b705cfSriastradh		kgem_cleanup(kgem);
428703b705cfSriastradh
428803b705cfSriastradh	kgem_reset(kgem);
428903b705cfSriastradh
429003b705cfSriastradh	assert(kgem->next_request != NULL);
429103b705cfSriastradh}
429203b705cfSriastradh
429303b705cfSriastradhvoid kgem_throttle(struct kgem *kgem)
429403b705cfSriastradh{
429563ef14f0Smrg	if (unlikely(kgem->wedged))
429603b705cfSriastradh		return;
429703b705cfSriastradh
4298813957e3Ssnj	if (__kgem_throttle(kgem, true)) {
429903b705cfSriastradh		xf86DrvMsg(kgem_get_screen_index(kgem), X_ERROR,
430003b705cfSriastradh			   "Detected a hung GPU, disabling acceleration.\n");
4301813957e3Ssnj		__kgem_set_wedged(kgem);
43029a906b70Schristos		kgem->need_throttle = false;
430303b705cfSriastradh	}
430403b705cfSriastradh}
430503b705cfSriastradh
/*
 * Perform a throttle check and hand its result back to the caller.
 * Unlike kgem_throttle(), this neither logs nor updates the wedged state.
 */
int kgem_is_wedged(struct kgem *kgem)
{
	const int status = __kgem_throttle(kgem, true);

	return status;
}
43109a906b70Schristos
43119a906b70Schristosstatic void kgem_purge_cache(struct kgem *kgem)
431203b705cfSriastradh{
431303b705cfSriastradh	struct kgem_bo *bo, *next;
431403b705cfSriastradh	int i;
431503b705cfSriastradh
431603b705cfSriastradh	for (i = 0; i < ARRAY_SIZE(kgem->inactive); i++) {
431703b705cfSriastradh		list_for_each_entry_safe(bo, next, &kgem->inactive[i], list) {
431803b705cfSriastradh			if (!kgem_bo_is_retained(kgem, bo)) {
431903b705cfSriastradh				DBG(("%s: purging %d\n",
432003b705cfSriastradh				     __FUNCTION__, bo->handle));
432103b705cfSriastradh				kgem_bo_free(kgem, bo);
432203b705cfSriastradh			}
432303b705cfSriastradh		}
432403b705cfSriastradh	}
432503b705cfSriastradh
432603b705cfSriastradh	kgem->need_purge = false;
432703b705cfSriastradh}
432803b705cfSriastradh
432903b705cfSriastradhvoid kgem_clean_scanout_cache(struct kgem *kgem)
433003b705cfSriastradh{
433103b705cfSriastradh	while (!list_is_empty(&kgem->scanout)) {
433203b705cfSriastradh		struct kgem_bo *bo;
433303b705cfSriastradh
433403b705cfSriastradh		bo = list_first_entry(&kgem->scanout, struct kgem_bo, list);
433503b705cfSriastradh
433603b705cfSriastradh		assert(bo->scanout);
433703b705cfSriastradh		assert(!bo->refcnt);
43389a906b70Schristos		assert(!bo->prime);
433903b705cfSriastradh		assert(bo->proxy == NULL);
434003b705cfSriastradh
434103b705cfSriastradh		if (bo->exec || __kgem_busy(kgem, bo->handle))
434203b705cfSriastradh			break;
434303b705cfSriastradh
434403b705cfSriastradh		DBG(("%s: handle=%d, fb=%d (reusable=%d)\n",
434503b705cfSriastradh		     __FUNCTION__, bo->handle, bo->delta, bo->reusable));
434603b705cfSriastradh		list_del(&bo->list);
434703b705cfSriastradh
43489a906b70Schristos		kgem_bo_rmfb(kgem, bo);
434903b705cfSriastradh		bo->scanout = false;
435003b705cfSriastradh
435103b705cfSriastradh		if (!bo->purged) {
435203b705cfSriastradh			bo->reusable = true;
435303b705cfSriastradh			if (kgem->has_llc &&
435403b705cfSriastradh			    !gem_set_caching(kgem->fd, bo->handle, SNOOPED))
435503b705cfSriastradh				bo->reusable = false;
435603b705cfSriastradh
435703b705cfSriastradh		}
435803b705cfSriastradh
435903b705cfSriastradh		__kgem_bo_destroy(kgem, bo);
436003b705cfSriastradh	}
436103b705cfSriastradh}
436203b705cfSriastradh
436303b705cfSriastradhvoid kgem_clean_large_cache(struct kgem *kgem)
436403b705cfSriastradh{
436503b705cfSriastradh	while (!list_is_empty(&kgem->large_inactive)) {
436603b705cfSriastradh		kgem_bo_free(kgem,
436703b705cfSriastradh			     list_first_entry(&kgem->large_inactive,
436803b705cfSriastradh					      struct kgem_bo, list));
436903b705cfSriastradh
437003b705cfSriastradh	}
437103b705cfSriastradh}
437203b705cfSriastradh
437303b705cfSriastradhbool kgem_expire_cache(struct kgem *kgem)
437403b705cfSriastradh{
437503b705cfSriastradh	time_t now, expire;
437603b705cfSriastradh	struct kgem_bo *bo;
437703b705cfSriastradh	unsigned int size = 0, count = 0;
437803b705cfSriastradh	bool idle;
437903b705cfSriastradh	unsigned int i;
438003b705cfSriastradh
438163ef14f0Smrg	if (!time(&now))
438263ef14f0Smrg		return false;
438303b705cfSriastradh
438403b705cfSriastradh	while (__kgem_freed_bo) {
438503b705cfSriastradh		bo = __kgem_freed_bo;
438603b705cfSriastradh		__kgem_freed_bo = *(struct kgem_bo **)bo;
438703b705cfSriastradh		free(bo);
438803b705cfSriastradh	}
438903b705cfSriastradh
439003b705cfSriastradh	while (__kgem_freed_request) {
439103b705cfSriastradh		struct kgem_request *rq = __kgem_freed_request;
439203b705cfSriastradh		__kgem_freed_request = *(struct kgem_request **)rq;
439303b705cfSriastradh		free(rq);
439403b705cfSriastradh	}
439503b705cfSriastradh
439603b705cfSriastradh	kgem_clean_large_cache(kgem);
439763ef14f0Smrg	if (__to_sna(kgem)->scrn->vtSema)
439803b705cfSriastradh		kgem_clean_scanout_cache(kgem);
439903b705cfSriastradh
440003b705cfSriastradh	expire = 0;
440103b705cfSriastradh	list_for_each_entry(bo, &kgem->snoop, list) {
440203b705cfSriastradh		if (bo->delta) {
440303b705cfSriastradh			expire = now - MAX_INACTIVE_TIME/2;
440403b705cfSriastradh			break;
440503b705cfSriastradh		}
440603b705cfSriastradh
440763ef14f0Smrg		assert(now);
440803b705cfSriastradh		bo->delta = now;
440903b705cfSriastradh	}
441003b705cfSriastradh	if (expire) {
441103b705cfSriastradh		while (!list_is_empty(&kgem->snoop)) {
441203b705cfSriastradh			bo = list_last_entry(&kgem->snoop, struct kgem_bo, list);
441303b705cfSriastradh
441403b705cfSriastradh			if (bo->delta > expire)
441503b705cfSriastradh				break;
441603b705cfSriastradh
441703b705cfSriastradh			kgem_bo_free(kgem, bo);
441803b705cfSriastradh		}
441903b705cfSriastradh	}
442003b705cfSriastradh#ifdef DEBUG_MEMORY
442103b705cfSriastradh	{
442203b705cfSriastradh		long snoop_size = 0;
442303b705cfSriastradh		int snoop_count = 0;
442403b705cfSriastradh		list_for_each_entry(bo, &kgem->snoop, list)
442503b705cfSriastradh			snoop_count++, snoop_size += bytes(bo);
44269a906b70Schristos		DBG(("%s: still allocated %d bo, %ld bytes, in snoop cache\n",
44279a906b70Schristos		     __FUNCTION__, snoop_count, snoop_size));
442803b705cfSriastradh	}
442903b705cfSriastradh#endif
443003b705cfSriastradh
443103b705cfSriastradh	kgem_retire(kgem);
443263ef14f0Smrg	if (unlikely(kgem->wedged))
443303b705cfSriastradh		kgem_cleanup(kgem);
443403b705cfSriastradh
443503b705cfSriastradh	kgem->expire(kgem);
443603b705cfSriastradh
443703b705cfSriastradh	if (kgem->need_purge)
443803b705cfSriastradh		kgem_purge_cache(kgem);
443903b705cfSriastradh
44409a906b70Schristos	if (kgem->need_retire)
44419a906b70Schristos		kgem_retire(kgem);
444203b705cfSriastradh
44439a906b70Schristos	expire = 0;
44449a906b70Schristos	idle = true;
444503b705cfSriastradh	for (i = 0; i < ARRAY_SIZE(kgem->inactive); i++) {
444603b705cfSriastradh		idle &= list_is_empty(&kgem->inactive[i]);
444703b705cfSriastradh		list_for_each_entry(bo, &kgem->inactive[i], list) {
444803b705cfSriastradh			if (bo->delta) {
444903b705cfSriastradh				expire = now - MAX_INACTIVE_TIME;
445003b705cfSriastradh				break;
445103b705cfSriastradh			}
445203b705cfSriastradh
445363ef14f0Smrg			assert(now);
445463ef14f0Smrg			kgem_bo_set_purgeable(kgem, bo);
445503b705cfSriastradh			bo->delta = now;
445603b705cfSriastradh		}
445703b705cfSriastradh	}
44589a906b70Schristos	if (expire == 0) {
44599a906b70Schristos		DBG(("%s: idle? %d\n", __FUNCTION__, idle));
44609a906b70Schristos		kgem->need_expire = !idle;
446103b705cfSriastradh		return false;
446203b705cfSriastradh	}
446303b705cfSriastradh
44649a906b70Schristos	idle = true;
446503b705cfSriastradh	for (i = 0; i < ARRAY_SIZE(kgem->inactive); i++) {
446603b705cfSriastradh		struct list preserve;
446703b705cfSriastradh
446803b705cfSriastradh		list_init(&preserve);
446903b705cfSriastradh		while (!list_is_empty(&kgem->inactive[i])) {
447003b705cfSriastradh			bo = list_last_entry(&kgem->inactive[i],
447103b705cfSriastradh					     struct kgem_bo, list);
447203b705cfSriastradh
447303b705cfSriastradh			if (bo->delta > expire) {
447403b705cfSriastradh				idle = false;
447503b705cfSriastradh				break;
447603b705cfSriastradh			}
447703b705cfSriastradh
44789a906b70Schristos			if (bo->map__cpu && bo->delta + MAP_PRESERVE_TIME > expire) {
447903b705cfSriastradh				idle = false;
448003b705cfSriastradh				list_move_tail(&bo->list, &preserve);
448103b705cfSriastradh			} else {
448203b705cfSriastradh				count++;
448303b705cfSriastradh				size += bytes(bo);
448403b705cfSriastradh				kgem_bo_free(kgem, bo);
448563ef14f0Smrg				DBG(("%s: expiring handle=%d\n",
448603b705cfSriastradh				     __FUNCTION__, bo->handle));
448703b705cfSriastradh			}
448803b705cfSriastradh		}
448963ef14f0Smrg		list_splice_tail(&preserve, &kgem->inactive[i]);
449003b705cfSriastradh	}
449103b705cfSriastradh
449203b705cfSriastradh#ifdef DEBUG_MEMORY
449303b705cfSriastradh	{
449403b705cfSriastradh		long inactive_size = 0;
449503b705cfSriastradh		int inactive_count = 0;
449603b705cfSriastradh		for (i = 0; i < ARRAY_SIZE(kgem->inactive); i++)
449703b705cfSriastradh			list_for_each_entry(bo, &kgem->inactive[i], list)
449803b705cfSriastradh				inactive_count++, inactive_size += bytes(bo);
44999a906b70Schristos		DBG(("%s: still allocated %d bo, %ld bytes, in inactive cache\n",
45009a906b70Schristos		     __FUNCTION__, inactive_count, inactive_size));
450103b705cfSriastradh	}
450203b705cfSriastradh#endif
450303b705cfSriastradh
450403b705cfSriastradh	DBG(("%s: expired %d objects, %d bytes, idle? %d\n",
450503b705cfSriastradh	     __FUNCTION__, count, size, idle));
450603b705cfSriastradh
450703b705cfSriastradh	kgem->need_expire = !idle;
45089a906b70Schristos	return count;
450903b705cfSriastradh	(void)count;
451003b705cfSriastradh	(void)size;
451103b705cfSriastradh}
451203b705cfSriastradh
45139a906b70Schristosbool kgem_cleanup_cache(struct kgem *kgem)
451403b705cfSriastradh{
451503b705cfSriastradh	unsigned int i;
451603b705cfSriastradh	int n;
451703b705cfSriastradh
451863ef14f0Smrg	DBG(("%s\n", __FUNCTION__));
451963ef14f0Smrg
452003b705cfSriastradh	/* sync to the most recent request */
452103b705cfSriastradh	for (n = 0; n < ARRAY_SIZE(kgem->requests); n++) {
452203b705cfSriastradh		if (!list_is_empty(&kgem->requests[n])) {
452303b705cfSriastradh			struct kgem_request *rq;
452403b705cfSriastradh
452563ef14f0Smrg			rq = list_last_entry(&kgem->requests[n],
452663ef14f0Smrg					     struct kgem_request,
452763ef14f0Smrg					     list);
452803b705cfSriastradh
452903b705cfSriastradh			DBG(("%s: sync on cleanup\n", __FUNCTION__));
453063ef14f0Smrg			assert(rq->ring == n);
453163ef14f0Smrg			assert(rq->bo);
453263ef14f0Smrg			assert(RQ(rq->bo->rq) == rq);
453363ef14f0Smrg			kgem_bo_wait(kgem, rq->bo);
453403b705cfSriastradh		}
453563ef14f0Smrg		assert(list_is_empty(&kgem->requests[n]));
453603b705cfSriastradh	}
453703b705cfSriastradh
453803b705cfSriastradh	kgem_retire(kgem);
453903b705cfSriastradh	kgem_cleanup(kgem);
454003b705cfSriastradh
454163ef14f0Smrg	DBG(("%s: need_expire?=%d\n", __FUNCTION__, kgem->need_expire));
45429a906b70Schristos	if (!kgem->need_expire)
45439a906b70Schristos		return false;
45449a906b70Schristos
454503b705cfSriastradh	for (i = 0; i < ARRAY_SIZE(kgem->inactive); i++) {
454603b705cfSriastradh		while (!list_is_empty(&kgem->inactive[i]))
454703b705cfSriastradh			kgem_bo_free(kgem,
454803b705cfSriastradh				     list_last_entry(&kgem->inactive[i],
454903b705cfSriastradh						     struct kgem_bo, list));
455003b705cfSriastradh	}
455103b705cfSriastradh
455203b705cfSriastradh	kgem_clean_large_cache(kgem);
455303b705cfSriastradh	kgem_clean_scanout_cache(kgem);
455403b705cfSriastradh
455503b705cfSriastradh	while (!list_is_empty(&kgem->snoop))
455603b705cfSriastradh		kgem_bo_free(kgem,
455703b705cfSriastradh			     list_last_entry(&kgem->snoop,
455803b705cfSriastradh					     struct kgem_bo, list));
455903b705cfSriastradh
456003b705cfSriastradh	while (__kgem_freed_bo) {
456103b705cfSriastradh		struct kgem_bo *bo = __kgem_freed_bo;
456203b705cfSriastradh		__kgem_freed_bo = *(struct kgem_bo **)bo;
456303b705cfSriastradh		free(bo);
456403b705cfSriastradh	}
456503b705cfSriastradh
456603b705cfSriastradh	kgem->need_purge = false;
456703b705cfSriastradh	kgem->need_expire = false;
456863ef14f0Smrg
456963ef14f0Smrg	DBG(("%s: complete\n", __FUNCTION__));
45709a906b70Schristos	return true;
457103b705cfSriastradh}
457203b705cfSriastradh
/*
 * Look through the bo caches for a linear (I915_TILING_NONE) buffer of at
 * least num_pages pages.
 *
 * flags handled here:
 *   CREATE_INACTIVE  - search the inactive lists only (use_active is false)
 *   CREATE_CPU_MAP /
 *   CREATE_GTT_MAP   - for inactive searches, first try the per-bucket
 *                      inactive vma list of the requested mapping kind
 *   CREATE_EXACT     - return NULL if that vma list had no usable bo
 *   CREATE_NO_RETIRE - return NULL instead of retiring when the inactive
 *                      bucket is empty
 *
 * On success the bo has been unlinked from the cache it was found in, its
 * delta is reset to 0, its pitch is 0 and its tiling is I915_TILING_NONE.
 * Returns NULL when nothing suitable was found.
 */
457303b705cfSriastradhstatic struct kgem_bo *
457403b705cfSriastradhsearch_linear_cache(struct kgem *kgem, unsigned int num_pages, unsigned flags)
457503b705cfSriastradh{
457603b705cfSriastradh	struct kgem_bo *bo, *first = NULL;
457703b705cfSriastradh	bool use_active = (flags & CREATE_INACTIVE) == 0;
457803b705cfSriastradh	struct list *cache;
457903b705cfSriastradh
458003b705cfSriastradh	DBG(("%s: num_pages=%d, flags=%x, use_active? %d, use_large=%d [max=%d]\n",
458103b705cfSriastradh	     __FUNCTION__, num_pages, flags, use_active,
458203b705cfSriastradh	     num_pages >= MAX_CACHE_SIZE / PAGE_SIZE,
458303b705cfSriastradh	     MAX_CACHE_SIZE / PAGE_SIZE));
458403b705cfSriastradh
458503b705cfSriastradh	assert(num_pages);
458603b705cfSriastradh
	/*
	 * Requests of MAX_CACHE_SIZE or more are served from the dedicated
	 * large / large_inactive lists; this branch always returns.
	 */
458703b705cfSriastradh	if (num_pages >= MAX_CACHE_SIZE / PAGE_SIZE) {
458803b705cfSriastradh		DBG(("%s: searching large buffers\n", __FUNCTION__));
458903b705cfSriastradhretry_large:
459003b705cfSriastradh		cache = use_active ? &kgem->large : &kgem->large_inactive;
		/* Inside this loop 'first' is only the safe-iteration cursor. */
459103b705cfSriastradh		list_for_each_entry_safe(bo, first, cache, list) {
459203b705cfSriastradh			assert(bo->refcnt == 0);
459303b705cfSriastradh			assert(bo->reusable);
459403b705cfSriastradh			assert(!bo->scanout);
459503b705cfSriastradh
459603b705cfSriastradh			if (num_pages > num_pages(bo))
459703b705cfSriastradh				goto discard;
459803b705cfSriastradh
459903b705cfSriastradh			if (bo->tiling != I915_TILING_NONE) {
460063ef14f0Smrg				if (use_active && kgem->gen < 040)
460103b705cfSriastradh					goto discard;
460203b705cfSriastradh
460363ef14f0Smrg				if (!kgem_set_tiling(kgem, bo,
460403b705cfSriastradh						    I915_TILING_NONE, 0))
460503b705cfSriastradh					goto discard;
460603b705cfSriastradh			}
460763ef14f0Smrg			assert(bo->tiling == I915_TILING_NONE);
460863ef14f0Smrg			bo->pitch = 0;
460903b705cfSriastradh
461003b705cfSriastradh			if (bo->purged && !kgem_bo_clear_purgeable(kgem, bo))
461103b705cfSriastradh				goto discard;
461203b705cfSriastradh
461303b705cfSriastradh			list_del(&bo->list);
46149a906b70Schristos			if (RQ(bo->rq) == (void *)kgem) {
46159a906b70Schristos				assert(bo->exec == NULL);
461603b705cfSriastradh				list_del(&bo->request);
46179a906b70Schristos			}
461803b705cfSriastradh
461903b705cfSriastradh			bo->delta = 0;
462003b705cfSriastradh			assert_tiling(kgem, bo);
462103b705cfSriastradh			return bo;
462203b705cfSriastradh
			/*
			 * Unsuitable candidate: it is freed only when taken
			 * from the inactive list; active ones stay in place.
			 */
462303b705cfSriastradhdiscard:
462403b705cfSriastradh			if (!use_active)
462503b705cfSriastradh				kgem_bo_free(kgem, bo);
462603b705cfSriastradh		}
462703b705cfSriastradh
		/* Active list exhausted: repeat the scan on the inactive list. */
462803b705cfSriastradh		if (use_active) {
462903b705cfSriastradh			use_active = false;
463003b705cfSriastradh			goto retry_large;
463103b705cfSriastradh		}
463203b705cfSriastradh
		/* Retry once more for as long as retiring reports progress. */
463303b705cfSriastradh		if (__kgem_throttle_retire(kgem, flags))
463403b705cfSriastradh			goto retry_large;
463503b705cfSriastradh
463603b705cfSriastradh		return NULL;
463703b705cfSriastradh	}
463803b705cfSriastradh
	/*
	 * Inactive-only search with an empty bucket: the only way to get a
	 * bo is to retire something from the matching active bucket.
	 */
463903b705cfSriastradh	if (!use_active && list_is_empty(inactive(kgem, num_pages))) {
464003b705cfSriastradh		DBG(("%s: inactive and cache bucket empty\n",
464103b705cfSriastradh		     __FUNCTION__));
464203b705cfSriastradh
464303b705cfSriastradh		if (flags & CREATE_NO_RETIRE) {
464403b705cfSriastradh			DBG(("%s: can not retire\n", __FUNCTION__));
464503b705cfSriastradh			return NULL;
464603b705cfSriastradh		}
464703b705cfSriastradh
464803b705cfSriastradh		if (list_is_empty(active(kgem, num_pages, I915_TILING_NONE))) {
464903b705cfSriastradh			DBG(("%s: active cache bucket empty\n", __FUNCTION__));
465003b705cfSriastradh			return NULL;
465103b705cfSriastradh		}
465203b705cfSriastradh
465303b705cfSriastradh		if (!__kgem_throttle_retire(kgem, flags)) {
465403b705cfSriastradh			DBG(("%s: nothing retired\n", __FUNCTION__));
465503b705cfSriastradh			return NULL;
465603b705cfSriastradh		}
465703b705cfSriastradh
465803b705cfSriastradh		if (list_is_empty(inactive(kgem, num_pages))) {
465903b705cfSriastradh			DBG(("%s: active cache bucket still empty after retire\n",
466003b705cfSriastradh			     __FUNCTION__));
466103b705cfSriastradh			return NULL;
466203b705cfSriastradh		}
466303b705cfSriastradh	}
466403b705cfSriastradh
	/*
	 * A mapping was requested: look in the inactive vma list for this
	 * bucket (indexed by for_cpu) for a bo that is already mapped.
	 */
466503b705cfSriastradh	if (!use_active && flags & (CREATE_CPU_MAP | CREATE_GTT_MAP)) {
466603b705cfSriastradh		int for_cpu = !!(flags & CREATE_CPU_MAP);
466703b705cfSriastradh		DBG(("%s: searching for inactive %s map\n",
466803b705cfSriastradh		     __FUNCTION__, for_cpu ? "cpu" : "gtt"));
466903b705cfSriastradh		cache = &kgem->vma[for_cpu].inactive[cache_bucket(num_pages)];
467003b705cfSriastradh		list_for_each_entry(bo, cache, vma) {
4671813957e3Ssnj			assert(for_cpu ? !!bo->map__cpu : (bo->map__gtt || bo->map__wc));
467203b705cfSriastradh			assert(bucket(bo) == cache_bucket(num_pages));
467303b705cfSriastradh			assert(bo->proxy == NULL);
467403b705cfSriastradh			assert(bo->rq == NULL);
467503b705cfSriastradh			assert(bo->exec == NULL);
467603b705cfSriastradh			assert(!bo->scanout);
467703b705cfSriastradh
467803b705cfSriastradh			if (num_pages > num_pages(bo)) {
467903b705cfSriastradh				DBG(("inactive too small: %d < %d\n",
468003b705cfSriastradh				     num_pages(bo), num_pages));
468103b705cfSriastradh				continue;
468203b705cfSriastradh			}
468303b705cfSriastradh
			/*
			 * The list is not iterated with the _safe variant, so
			 * the walk must stop once the current bo is freed.
			 */
468403b705cfSriastradh			if (bo->purged && !kgem_bo_clear_purgeable(kgem, bo)) {
468503b705cfSriastradh				kgem_bo_free(kgem, bo);
468603b705cfSriastradh				break;
468703b705cfSriastradh			}
468803b705cfSriastradh
468963ef14f0Smrg			if (!kgem_set_tiling(kgem, bo, I915_TILING_NONE, 0)) {
469063ef14f0Smrg				kgem_bo_free(kgem, bo);
469163ef14f0Smrg				break;
469263ef14f0Smrg			}
469303b705cfSriastradh
469403b705cfSriastradh			kgem_bo_remove_from_inactive(kgem, bo);
46959a906b70Schristos			assert(list_is_empty(&bo->vma));
46969a906b70Schristos			assert(list_is_empty(&bo->list));
469703b705cfSriastradh
469863ef14f0Smrg			assert(bo->tiling == I915_TILING_NONE);
469963ef14f0Smrg			assert(bo->pitch == 0);
470003b705cfSriastradh			bo->delta = 0;
470103b705cfSriastradh			DBG(("  %s: found handle=%d (num_pages=%d) in linear vma cache\n",
470203b705cfSriastradh			     __FUNCTION__, bo->handle, num_pages(bo)));
470303b705cfSriastradh			assert(use_active || bo->domain != DOMAIN_GPU);
470403b705cfSriastradh			assert(!bo->needs_flush);
470503b705cfSriastradh			assert_tiling(kgem, bo);
470603b705cfSriastradh			ASSERT_MAYBE_IDLE(kgem, bo->handle, !use_active);
470703b705cfSriastradh			return bo;
470803b705cfSriastradh		}
470903b705cfSriastradh
471003b705cfSriastradh		if (flags & CREATE_EXACT)
471103b705cfSriastradh			return NULL;
471203b705cfSriastradh
		/* Without LLC, a CPU-map request is not served from the plain bucket. */
471303b705cfSriastradh		if (flags & CREATE_CPU_MAP && !kgem->has_llc)
471403b705cfSriastradh			return NULL;
471503b705cfSriastradh	}
471603b705cfSriastradh
	/* General scan of the size bucket on the active or inactive list. */
471703b705cfSriastradh	cache = use_active ? active(kgem, num_pages, I915_TILING_NONE) : inactive(kgem, num_pages);
471803b705cfSriastradh	list_for_each_entry(bo, cache, list) {
471903b705cfSriastradh		assert(bo->refcnt == 0);
472003b705cfSriastradh		assert(bo->reusable);
472103b705cfSriastradh		assert(!!bo->rq == !!use_active);
472203b705cfSriastradh		assert(bo->proxy == NULL);
472303b705cfSriastradh		assert(!bo->scanout);
472403b705cfSriastradh
472503b705cfSriastradh		if (num_pages > num_pages(bo))
472603b705cfSriastradh			continue;
472703b705cfSriastradh
472803b705cfSriastradh		if (use_active &&
472903b705cfSriastradh		    kgem->gen <= 040 &&
473003b705cfSriastradh		    bo->tiling != I915_TILING_NONE)
473103b705cfSriastradh			continue;
473203b705cfSriastradh
473303b705cfSriastradh		if (bo->purged && !kgem_bo_clear_purgeable(kgem, bo)) {
473403b705cfSriastradh			kgem_bo_free(kgem, bo);
473503b705cfSriastradh			break;
473603b705cfSriastradh		}
473703b705cfSriastradh
		/*
		 * A tiled bo is converted to linear only when no mapping was
		 * requested and no fallback candidate has been recorded yet.
		 */
473803b705cfSriastradh		if (I915_TILING_NONE != bo->tiling) {
473903b705cfSriastradh			if (flags & (CREATE_CPU_MAP | CREATE_GTT_MAP))
474003b705cfSriastradh				continue;
474103b705cfSriastradh
474203b705cfSriastradh			if (first)
474303b705cfSriastradh				continue;
474403b705cfSriastradh
474563ef14f0Smrg			if (!kgem_set_tiling(kgem, bo, I915_TILING_NONE, 0))
474603b705cfSriastradh				continue;
474703b705cfSriastradh		}
474863ef14f0Smrg		assert(bo->tiling == I915_TILING_NONE);
474963ef14f0Smrg		bo->pitch = 0;
475003b705cfSriastradh
		/*
		 * Candidate selection. The bo is returned immediately when it
		 * is mapped but a mapping of the other kind was requested, or
		 * when it is unmapped and no mapping was requested. In every
		 * other accepted case it is recorded in 'first' and the scan
		 * continues; meeting a second such candidate ends the scan.
		 */
4751813957e3Ssnj		if (bo->map__gtt || bo->map__wc || bo->map__cpu) {
475203b705cfSriastradh			if (flags & (CREATE_CPU_MAP | CREATE_GTT_MAP)) {
475303b705cfSriastradh				int for_cpu = !!(flags & CREATE_CPU_MAP);
4754813957e3Ssnj				if (for_cpu ? !!bo->map__cpu : (bo->map__gtt || bo->map__wc)){
475503b705cfSriastradh					if (first != NULL)
475603b705cfSriastradh						break;
475703b705cfSriastradh
475803b705cfSriastradh					first = bo;
475903b705cfSriastradh					continue;
476003b705cfSriastradh				}
476103b705cfSriastradh			} else {
476203b705cfSriastradh				if (first != NULL)
476303b705cfSriastradh					break;
476403b705cfSriastradh
476503b705cfSriastradh				first = bo;
476603b705cfSriastradh				continue;
476703b705cfSriastradh			}
476803b705cfSriastradh		} else {
47699a906b70Schristos			if (flags & CREATE_GTT_MAP && !kgem_bo_can_map(kgem, bo))
47709a906b70Schristos				continue;
47719a906b70Schristos
477203b705cfSriastradh			if (flags & (CREATE_CPU_MAP | CREATE_GTT_MAP)) {
477303b705cfSriastradh				if (first != NULL)
477403b705cfSriastradh					break;
477503b705cfSriastradh
477603b705cfSriastradh				first = bo;
477703b705cfSriastradh				continue;
477803b705cfSriastradh			}
477903b705cfSriastradh		}
478003b705cfSriastradh
478103b705cfSriastradh		if (use_active)
478203b705cfSriastradh			kgem_bo_remove_from_active(kgem, bo);
478303b705cfSriastradh		else
478403b705cfSriastradh			kgem_bo_remove_from_inactive(kgem, bo);
478503b705cfSriastradh
478603b705cfSriastradh		assert(bo->tiling == I915_TILING_NONE);
478763ef14f0Smrg		assert(bo->pitch == 0);
478803b705cfSriastradh		bo->delta = 0;
478903b705cfSriastradh		DBG(("  %s: found handle=%d (num_pages=%d) in linear %s cache\n",
479003b705cfSriastradh		     __FUNCTION__, bo->handle, num_pages(bo),
479103b705cfSriastradh		     use_active ? "active" : "inactive"));
479203b705cfSriastradh		assert(list_is_empty(&bo->list));
47939a906b70Schristos		assert(list_is_empty(&bo->vma));
479403b705cfSriastradh		assert(use_active || bo->domain != DOMAIN_GPU);
479503b705cfSriastradh		assert(!bo->needs_flush || use_active);
479603b705cfSriastradh		assert_tiling(kgem, bo);
479703b705cfSriastradh		ASSERT_MAYBE_IDLE(kgem, bo->handle, !use_active);
479803b705cfSriastradh		return bo;
479903b705cfSriastradh	}
480003b705cfSriastradh
	/* Nothing was returned from the scan: use the recorded candidate. */
480103b705cfSriastradh	if (first) {
480203b705cfSriastradh		assert(first->tiling == I915_TILING_NONE);
480303b705cfSriastradh
480403b705cfSriastradh		if (use_active)
480503b705cfSriastradh			kgem_bo_remove_from_active(kgem, first);
480603b705cfSriastradh		else
480703b705cfSriastradh			kgem_bo_remove_from_inactive(kgem, first);
480803b705cfSriastradh
480903b705cfSriastradh		first->pitch = 0;
481003b705cfSriastradh		first->delta = 0;
481103b705cfSriastradh		DBG(("  %s: found handle=%d (near-miss) (num_pages=%d) in linear %s cache\n",
481203b705cfSriastradh		     __FUNCTION__, first->handle, num_pages(first),
481303b705cfSriastradh		     use_active ? "active" : "inactive"));
481403b705cfSriastradh		assert(list_is_empty(&first->list));
48159a906b70Schristos		assert(list_is_empty(&first->vma));
481603b705cfSriastradh		assert(use_active || first->domain != DOMAIN_GPU);
481703b705cfSriastradh		assert(!first->needs_flush || use_active);
481803b705cfSriastradh		ASSERT_MAYBE_IDLE(kgem, first->handle, !use_active);
481903b705cfSriastradh		return first;
482003b705cfSriastradh	}
482103b705cfSriastradh
482203b705cfSriastradh	return NULL;
482303b705cfSriastradh}
482403b705cfSriastradh
482503b705cfSriastradhstruct kgem_bo *kgem_create_for_name(struct kgem *kgem, uint32_t name)
482603b705cfSriastradh{
482703b705cfSriastradh	struct drm_gem_open open_arg;
48289a906b70Schristos	struct drm_i915_gem_get_tiling tiling;
482903b705cfSriastradh	struct kgem_bo *bo;
483003b705cfSriastradh
483103b705cfSriastradh	DBG(("%s(name=%d)\n", __FUNCTION__, name));
483203b705cfSriastradh
483303b705cfSriastradh	VG_CLEAR(open_arg);
483403b705cfSriastradh	open_arg.name = name;
48359a906b70Schristos	if (do_ioctl(kgem->fd, DRM_IOCTL_GEM_OPEN, &open_arg))
483603b705cfSriastradh		return NULL;
483703b705cfSriastradh
483803b705cfSriastradh	DBG(("%s: new handle=%d\n", __FUNCTION__, open_arg.handle));
48399a906b70Schristos
48409a906b70Schristos	VG_CLEAR(tiling);
48419a906b70Schristos	tiling.handle = open_arg.handle;
48429a906b70Schristos	if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_GET_TILING, &tiling)) {
48439a906b70Schristos		DBG(("%s(name=%d) get-tiling failed, ret=%d\n", __FUNCTION__, name, errno));
48449a906b70Schristos		gem_close(kgem->fd, open_arg.handle);
48459a906b70Schristos		return NULL;
48469a906b70Schristos	}
48479a906b70Schristos
48489a906b70Schristos	DBG(("%s: handle=%d, tiling=%d\n", __FUNCTION__, tiling.handle, tiling.tiling_mode));
48499a906b70Schristos
485003b705cfSriastradh	bo = __kgem_bo_alloc(open_arg.handle, open_arg.size / PAGE_SIZE);
485103b705cfSriastradh	if (bo == NULL) {
485203b705cfSriastradh		gem_close(kgem->fd, open_arg.handle);
485303b705cfSriastradh		return NULL;
485403b705cfSriastradh	}
485503b705cfSriastradh
48569a906b70Schristos	bo->unique_id = kgem_get_unique_id(kgem);
48579a906b70Schristos	bo->tiling = tiling.tiling_mode;
48589a906b70Schristos	bo->prime = true;
485963ef14f0Smrg	bo->reusable = false;
486063ef14f0Smrg	kgem_bo_unclean(kgem, bo);
486103b705cfSriastradh
486203b705cfSriastradh	debug_alloc__bo(kgem, bo);
486303b705cfSriastradh	return bo;
486403b705cfSriastradh}
486503b705cfSriastradh
/*
 * Import a PRIME (dma-buf) file descriptor as a kgem_bo.
 *
 * name is the dma-buf fd; size is the caller's estimate of the required
 * size in bytes. If lseek(SEEK_END) on the fd succeeds, its result replaces
 * the estimate, and the import is refused when the estimate is larger than
 * the actual size.
 *
 * The bo is flagged prime and non-reusable with domain DOMAIN_NONE. Its
 * caching mode is then queried (defaulting to kgem->has_llc if the query
 * fails) to decide whether to treat it as a foreign scanout or a foreign
 * snooped buffer; a tiled snooped buffer is rejected.
 *
 * Returns NULL on any failure, or when PRIME import is not compiled in.
 */
struct kgem_bo *kgem_create_for_prime(struct kgem *kgem, int name, uint32_t size)
{
#ifdef DRM_IOCTL_PRIME_FD_TO_HANDLE
	struct drm_prime_handle prime;
	struct drm_i915_gem_get_tiling get_tiling;
	struct local_i915_gem_caching get_caching;
	struct kgem_bo *bo;
	off_t actual;

	DBG(("%s(name=%d)\n", __FUNCTION__, name));

	VG_CLEAR(prime);
	prime.fd = name;
	prime.flags = 0;
	if (do_ioctl(kgem->fd, DRM_IOCTL_PRIME_FD_TO_HANDLE, &prime)) {
		DBG(("%s(name=%d) fd-to-handle failed, ret=%d\n", __FUNCTION__, name, errno));
		return NULL;
	}

	VG_CLEAR(get_tiling);
	get_tiling.handle = prime.handle;
	if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_GET_TILING, &get_tiling)) {
		DBG(("%s(name=%d) get-tiling failed, ret=%d\n", __FUNCTION__, name, errno));
		goto err_close;
	}

	/* Query actual size, overriding specified if available */
	actual = lseek(prime.fd, 0, SEEK_END);
	DBG(("%s: estimated size=%ld, actual=%lld\n",
	     __FUNCTION__, (long)size, (long long)actual));
	if (actual != -1) {
		if (size > actual) {
			DBG(("%s(name=%d) estimated required size [%d] is larger than actual [%ld]\n", __FUNCTION__, name, size, (long)actual));
			goto err_close;
		}
		size = actual;
	}

	DBG(("%s: new handle=%d, tiling=%d\n", __FUNCTION__,
	     prime.handle, get_tiling.tiling_mode));
	bo = __kgem_bo_alloc(prime.handle, NUM_PAGES(size));
	if (bo == NULL)
		goto err_close;

	bo->unique_id = kgem_get_unique_id(kgem);
	bo->tiling = get_tiling.tiling_mode;
	bo->reusable = false;
	bo->prime = true;
	bo->domain = DOMAIN_NONE;

	/* is this a special bo (e.g. scanout or CPU coherent)? */

	VG_CLEAR(get_caching);
	get_caching.handle = prime.handle;
	/* Pre-load the default so a failed query leaves a sane answer. */
	get_caching.caching = kgem->has_llc;
	(void)drmIoctl(kgem->fd, LOCAL_IOCTL_I915_GEM_GET_CACHING, &get_caching);
	DBG(("%s: imported handle=%d has caching %d\n", __FUNCTION__, prime.handle, get_caching.caching));

	if (get_caching.caching == 0) {
		if (kgem->has_llc) {
			DBG(("%s: interpreting handle=%d as a foreign scanout\n",
			     __FUNCTION__, prime.handle));
			bo->scanout = true;
		}
	} else if (get_caching.caching == 1) {
		if (!kgem->has_llc) {
			DBG(("%s: interpreting handle=%d as a foreign snooped buffer\n",
			     __FUNCTION__, prime.handle));
			bo->snoop = true;
			if (bo->tiling) {
				DBG(("%s: illegal snooped tiled buffer\n", __FUNCTION__));
				kgem_bo_free(kgem, bo);
				return NULL;
			}
		}
	} else if (get_caching.caching == 2) {
		DBG(("%s: interpreting handle=%d as a foreign scanout\n",
		     __FUNCTION__, prime.handle));
		bo->scanout = true;
	}

	debug_alloc__bo(kgem, bo);
	return bo;

err_close:
	gem_close(kgem->fd, prime.handle);
	return NULL;
#else
	return NULL;
#endif
}
496003b705cfSriastradh
/*
 * Export bo as a PRIME (dma-buf) file descriptor opened with O_CLOEXEC.
 *
 * On success the bo is marked non-reusable and the new fd is returned.
 * Returns -1 if the ioctl fails or PRIME export is not compiled in.
 */
int kgem_bo_export_to_prime(struct kgem *kgem, struct kgem_bo *bo)
{
#if defined(DRM_IOCTL_PRIME_HANDLE_TO_FD) && defined(O_CLOEXEC)
	struct drm_prime_handle prime;

	assert(kgem_bo_is_fenced(kgem, bo));

	VG_CLEAR(prime);
	prime.handle = bo->handle;
	prime.flags = O_CLOEXEC;

	if (do_ioctl(kgem->fd, DRM_IOCTL_PRIME_HANDLE_TO_FD, &prime) == 0) {
		bo->reusable = false;
		return prime.fd;
	}

	return -1;
#else
	return -1;
#endif
}
498103b705cfSriastradh
498203b705cfSriastradhstruct kgem_bo *kgem_create_linear(struct kgem *kgem, int size, unsigned flags)
498303b705cfSriastradh{
498403b705cfSriastradh	struct kgem_bo *bo;
498503b705cfSriastradh	uint32_t handle;
498603b705cfSriastradh
498703b705cfSriastradh	DBG(("%s(%d)\n", __FUNCTION__, size));
498803b705cfSriastradh	assert(size);
498903b705cfSriastradh
499003b705cfSriastradh	if (flags & CREATE_GTT_MAP && kgem->has_llc) {
499103b705cfSriastradh		flags &= ~CREATE_GTT_MAP;
499203b705cfSriastradh		flags |= CREATE_CPU_MAP;
499303b705cfSriastradh	}
499403b705cfSriastradh
499503b705cfSriastradh	size = NUM_PAGES(size);
4996813957e3Ssnj	if ((flags & CREATE_UNCACHED) == 0) {
4997813957e3Ssnj		bo = search_linear_cache(kgem, size, CREATE_INACTIVE | flags);
4998813957e3Ssnj		if (bo) {
499963ef14f0Smrg			assert(!bo->purged);
500063ef14f0Smrg			assert(!bo->delta);
5001813957e3Ssnj			assert(bo->domain != DOMAIN_GPU);
5002813957e3Ssnj			ASSERT_IDLE(kgem, bo->handle);
5003813957e3Ssnj			bo->refcnt = 1;
5004813957e3Ssnj			return bo;
5005813957e3Ssnj		}
500603b705cfSriastradh
5007813957e3Ssnj		if (flags & CREATE_CACHED)
5008813957e3Ssnj			return NULL;
5009813957e3Ssnj	}
501003b705cfSriastradh
501103b705cfSriastradh	handle = gem_create(kgem->fd, size);
501203b705cfSriastradh	if (handle == 0)
501303b705cfSriastradh		return NULL;
501403b705cfSriastradh
501503b705cfSriastradh	DBG(("%s: new handle=%d, num_pages=%d\n", __FUNCTION__, handle, size));
501603b705cfSriastradh	bo = __kgem_bo_alloc(handle, size);
501703b705cfSriastradh	if (bo == NULL) {
501803b705cfSriastradh		gem_close(kgem->fd, handle);
501903b705cfSriastradh		return NULL;
502003b705cfSriastradh	}
502103b705cfSriastradh
502203b705cfSriastradh	debug_alloc__bo(kgem, bo);
502303b705cfSriastradh	return bo;
502403b705cfSriastradh}
502503b705cfSriastradh
502603b705cfSriastradhint kgem_choose_tiling(struct kgem *kgem, int tiling, int width, int height, int bpp)
502703b705cfSriastradh{
502803b705cfSriastradh	if (DBG_NO_TILING)
502903b705cfSriastradh		return tiling < 0 ? tiling : I915_TILING_NONE;
503003b705cfSriastradh
503103b705cfSriastradh	if (kgem->gen < 040) {
503203b705cfSriastradh		if (tiling && width * bpp > 8192 * 8) {
503303b705cfSriastradh			DBG(("%s: pitch too large for tliing [%d]\n",
503403b705cfSriastradh			     __FUNCTION__, width*bpp/8));
503503b705cfSriastradh			tiling = I915_TILING_NONE;
503603b705cfSriastradh			goto done;
503703b705cfSriastradh		}
503803b705cfSriastradh	} else {
503903b705cfSriastradh		if (width*bpp > (MAXSHORT-512) * 8) {
504003b705cfSriastradh			if (tiling > 0)
504103b705cfSriastradh				tiling = -tiling;
504203b705cfSriastradh			else if (tiling == 0)
504303b705cfSriastradh				tiling = -I915_TILING_X;
504403b705cfSriastradh			DBG(("%s: large pitch [%d], forcing TILING [%d]\n",
504503b705cfSriastradh			     __FUNCTION__, width*bpp/8, tiling));
504603b705cfSriastradh		} else if (tiling && (width|height) > 8192) {
504703b705cfSriastradh			DBG(("%s: large tiled buffer [%dx%d], forcing TILING_X\n",
504803b705cfSriastradh			     __FUNCTION__, width, height));
504903b705cfSriastradh			tiling = -I915_TILING_X;
505003b705cfSriastradh		}
505103b705cfSriastradh
505203b705cfSriastradh		/* fences limited to 128k (256k on ivb) */
505303b705cfSriastradh		assert(width * bpp <= 128 * 1024 * 8);
505403b705cfSriastradh	}
505503b705cfSriastradh
505603b705cfSriastradh	if (tiling < 0)
505703b705cfSriastradh		return tiling;
505803b705cfSriastradh
50599a906b70Schristos	if (tiling == I915_TILING_Y && !kgem->can_render_y)
50609a906b70Schristos		tiling = I915_TILING_X;
50619a906b70Schristos
506203b705cfSriastradh	if (tiling && (height == 1 || width == 1)) {
506303b705cfSriastradh		DBG(("%s: disabling tiling [%dx%d] for single row/col\n",
506403b705cfSriastradh		     __FUNCTION__,width, height));
506503b705cfSriastradh		tiling = I915_TILING_NONE;
506603b705cfSriastradh		goto done;
506703b705cfSriastradh	}
506803b705cfSriastradh	if (tiling == I915_TILING_Y && height <= 16) {
506903b705cfSriastradh		DBG(("%s: too short [%d] for TILING_Y\n",
507003b705cfSriastradh		     __FUNCTION__,height));
507103b705cfSriastradh		tiling = I915_TILING_X;
507203b705cfSriastradh	}
507303b705cfSriastradh	if (tiling && width * bpp > 8 * (4096 - 64)) {
507403b705cfSriastradh		DBG(("%s: TLB miss between lines %dx%d (pitch=%d), forcing tiling %d\n",
507503b705cfSriastradh		     __FUNCTION__,
507603b705cfSriastradh		     width, height, width*bpp/8,
507703b705cfSriastradh		     tiling));
507803b705cfSriastradh		return -tiling;
507903b705cfSriastradh	}
508003b705cfSriastradh	if (tiling == I915_TILING_X && height < 4) {
508103b705cfSriastradh		DBG(("%s: too short [%d] for TILING_X\n",
508203b705cfSriastradh		     __FUNCTION__, height));
508303b705cfSriastradh		tiling = I915_TILING_NONE;
508403b705cfSriastradh		goto done;
508503b705cfSriastradh	}
508603b705cfSriastradh
50879a906b70Schristos	if (tiling == I915_TILING_X && width * bpp <= 8*512) {
508803b705cfSriastradh		DBG(("%s: too thin [width %d, %d bpp] for TILING_X\n",
508903b705cfSriastradh		     __FUNCTION__, width, bpp));
509003b705cfSriastradh		tiling = I915_TILING_NONE;
509103b705cfSriastradh		goto done;
509203b705cfSriastradh	}
50939a906b70Schristos	if (tiling == I915_TILING_Y && width * bpp < 8*128) {
509403b705cfSriastradh		DBG(("%s: too thin [%d] for TILING_Y\n",
509503b705cfSriastradh		     __FUNCTION__, width));
509603b705cfSriastradh		tiling = I915_TILING_NONE;
509703b705cfSriastradh		goto done;
509803b705cfSriastradh	}
509903b705cfSriastradh
510003b705cfSriastradh	if (tiling && ALIGN(height, 2) * ALIGN(width*bpp, 8*64) <= 4096 * 8) {
510103b705cfSriastradh		DBG(("%s: too small [%d bytes] for TILING_%c\n", __FUNCTION__,
510203b705cfSriastradh		     ALIGN(height, 2) * ALIGN(width*bpp, 8*64) / 8,
510303b705cfSriastradh		     tiling == I915_TILING_X ? 'X' : 'Y'));
510403b705cfSriastradh		tiling = I915_TILING_NONE;
510503b705cfSriastradh		goto done;
510603b705cfSriastradh	}
510703b705cfSriastradh
510803b705cfSriastradh	if (tiling && width * bpp >= 8 * 4096 / 2) {
510903b705cfSriastradh		DBG(("%s: TLB near-miss between lines %dx%d (pitch=%d), forcing tiling %d\n",
511003b705cfSriastradh		     __FUNCTION__,
511103b705cfSriastradh		     width, height, width*bpp/8,
511203b705cfSriastradh		     tiling));
511303b705cfSriastradh		return -tiling;
511403b705cfSriastradh	}
511503b705cfSriastradh
511603b705cfSriastradhdone:
511703b705cfSriastradh	DBG(("%s: %dx%d -> %d\n", __FUNCTION__, width, height, tiling));
511803b705cfSriastradh	return tiling;
511903b705cfSriastradh}
512003b705cfSriastradh
/*
 * Map a drawable depth to the storage size of one pixel in bits.
 *
 * Depth 8 uses 8 bits, depths 15 and 16 use 16 bits, and depths 24, 30
 * and 32 use 32 bits.  Any other depth is unsupported and yields 0.
 */
static int bits_per_pixel(int depth)
{
	if (depth == 8)
		return 8;

	if (depth == 15 || depth == 16)
		return 16;

	if (depth == 24 || depth == 30 || depth == 32)
		return 32;

	return 0;
}
513303b705cfSriastradh
513403b705cfSriastradhunsigned kgem_can_create_2d(struct kgem *kgem,
513503b705cfSriastradh			    int width, int height, int depth)
513603b705cfSriastradh{
513703b705cfSriastradh	uint32_t pitch, size;
513803b705cfSriastradh	unsigned flags = 0;
513903b705cfSriastradh	int tiling;
514003b705cfSriastradh	int bpp;
514103b705cfSriastradh
514203b705cfSriastradh	DBG(("%s: %dx%d @ %d\n", __FUNCTION__, width, height, depth));
514303b705cfSriastradh
514403b705cfSriastradh	bpp = bits_per_pixel(depth);
514503b705cfSriastradh	if (bpp == 0) {
514603b705cfSriastradh		DBG(("%s: unhandled depth %d\n", __FUNCTION__, depth));
514703b705cfSriastradh		return 0;
514803b705cfSriastradh	}
514903b705cfSriastradh
515003b705cfSriastradh	if (width > MAXSHORT || height > MAXSHORT) {
515103b705cfSriastradh		DBG(("%s: unhandled size %dx%d\n",
515203b705cfSriastradh		     __FUNCTION__, width, height));
515303b705cfSriastradh		return 0;
515403b705cfSriastradh	}
515503b705cfSriastradh
515603b705cfSriastradh	size = kgem_surface_size(kgem, false, 0,
515703b705cfSriastradh				 width, height, bpp,
515803b705cfSriastradh				 I915_TILING_NONE, &pitch);
515903b705cfSriastradh	DBG(("%s: untiled size=%d\n", __FUNCTION__, size));
516003b705cfSriastradh	if (size > 0) {
516103b705cfSriastradh		if (size <= kgem->max_cpu_size)
516203b705cfSriastradh			flags |= KGEM_CAN_CREATE_CPU;
51639a906b70Schristos		if (size > 4096 && size <= kgem->max_gpu_size)
516403b705cfSriastradh			flags |= KGEM_CAN_CREATE_GPU;
5165813957e3Ssnj		if (size <= PAGE_SIZE*kgem->aperture_mappable/4 || kgem->has_wc_mmap)
516603b705cfSriastradh			flags |= KGEM_CAN_CREATE_GTT;
516703b705cfSriastradh		if (size > kgem->large_object_size)
516803b705cfSriastradh			flags |= KGEM_CAN_CREATE_LARGE;
516903b705cfSriastradh		if (size > kgem->max_object_size) {
517003b705cfSriastradh			DBG(("%s: too large (untiled) %d > %d\n",
517103b705cfSriastradh			     __FUNCTION__, size, kgem->max_object_size));
517203b705cfSriastradh			return 0;
517303b705cfSriastradh		}
517403b705cfSriastradh	}
517503b705cfSriastradh
517603b705cfSriastradh	tiling = kgem_choose_tiling(kgem, I915_TILING_X,
517703b705cfSriastradh				    width, height, bpp);
517803b705cfSriastradh	if (tiling != I915_TILING_NONE) {
517903b705cfSriastradh		size = kgem_surface_size(kgem, false, 0,
518003b705cfSriastradh					 width, height, bpp, tiling,
518103b705cfSriastradh					 &pitch);
518203b705cfSriastradh		DBG(("%s: tiled[%d] size=%d\n", __FUNCTION__, tiling, size));
518303b705cfSriastradh		if (size > 0 && size <= kgem->max_gpu_size)
51849a906b70Schristos			flags |= KGEM_CAN_CREATE_GPU | KGEM_CAN_CREATE_TILED;
51859a906b70Schristos		if (size > 0 && size <= PAGE_SIZE*kgem->aperture_mappable/4)
518603b705cfSriastradh			flags |= KGEM_CAN_CREATE_GTT;
51879a906b70Schristos		if (size > PAGE_SIZE*kgem->aperture_mappable/4)
51889a906b70Schristos			flags &= ~KGEM_CAN_CREATE_GTT;
518903b705cfSriastradh		if (size > kgem->large_object_size)
519003b705cfSriastradh			flags |= KGEM_CAN_CREATE_LARGE;
519103b705cfSriastradh		if (size > kgem->max_object_size) {
519203b705cfSriastradh			DBG(("%s: too large (tiled) %d > %d\n",
519303b705cfSriastradh			     __FUNCTION__, size, kgem->max_object_size));
519403b705cfSriastradh			return 0;
519503b705cfSriastradh		}
51969a906b70Schristos		if (kgem->gen < 040) {
51979a906b70Schristos			int fence_size = 1024 * 1024;
51989a906b70Schristos			while (fence_size < size)
51999a906b70Schristos				fence_size <<= 1;
52009a906b70Schristos			if (fence_size > kgem->max_gpu_size)
52019a906b70Schristos				flags &= ~KGEM_CAN_CREATE_GPU | KGEM_CAN_CREATE_TILED;
52029a906b70Schristos			if (fence_size > PAGE_SIZE*kgem->aperture_fenceable/4)
52039a906b70Schristos				flags &= ~KGEM_CAN_CREATE_GTT;
52049a906b70Schristos		}
520503b705cfSriastradh	}
520603b705cfSriastradh
520703b705cfSriastradh	return flags;
520803b705cfSriastradh}
520903b705cfSriastradh
521003b705cfSriastradhinline int kgem_bo_fenced_size(struct kgem *kgem, struct kgem_bo *bo)
521103b705cfSriastradh{
521203b705cfSriastradh	unsigned int size;
521303b705cfSriastradh
521403b705cfSriastradh	assert(bo->tiling);
521503b705cfSriastradh	assert_tiling(kgem, bo);
521603b705cfSriastradh	assert(kgem->gen < 040);
521703b705cfSriastradh
521803b705cfSriastradh	if (kgem->gen < 030)
52199a906b70Schristos		size = 512 * 1024 / PAGE_SIZE;
522003b705cfSriastradh	else
52219a906b70Schristos		size = 1024 * 1024 / PAGE_SIZE;
52229a906b70Schristos	while (size < num_pages(bo))
52239a906b70Schristos		size <<= 1;
522403b705cfSriastradh
522503b705cfSriastradh	return size;
522603b705cfSriastradh}
522703b705cfSriastradh
522803b705cfSriastradhstatic struct kgem_bo *
522903b705cfSriastradh__kgem_bo_create_as_display(struct kgem *kgem, int size, int tiling, int pitch)
523003b705cfSriastradh{
523103b705cfSriastradh	struct local_i915_gem_create2 args;
523203b705cfSriastradh	struct kgem_bo *bo;
523303b705cfSriastradh
523403b705cfSriastradh	if (!kgem->has_create2)
523503b705cfSriastradh		return NULL;
523603b705cfSriastradh
523703b705cfSriastradh	memset(&args, 0, sizeof(args));
523803b705cfSriastradh	args.size = size * PAGE_SIZE;
523903b705cfSriastradh	args.placement = LOCAL_I915_CREATE_PLACEMENT_STOLEN;
524003b705cfSriastradh	args.caching = DISPLAY;
524103b705cfSriastradh	args.tiling_mode = tiling;
524203b705cfSriastradh	args.stride = pitch;
524303b705cfSriastradh
52449a906b70Schristos	if (do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_CREATE2, &args)) {
524503b705cfSriastradh		args.placement = LOCAL_I915_CREATE_PLACEMENT_SYSTEM;
52469a906b70Schristos		if (do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_CREATE2, &args))
524703b705cfSriastradh			return NULL;
524803b705cfSriastradh	}
524903b705cfSriastradh
525003b705cfSriastradh	bo = __kgem_bo_alloc(args.handle, size);
525103b705cfSriastradh	if (bo == NULL) {
525203b705cfSriastradh		gem_close(kgem->fd, args.handle);
525303b705cfSriastradh		return NULL;
525403b705cfSriastradh	}
525503b705cfSriastradh
525603b705cfSriastradh	bo->unique_id = kgem_get_unique_id(kgem);
525703b705cfSriastradh	bo->tiling = tiling;
525803b705cfSriastradh	bo->pitch = pitch;
525903b705cfSriastradh	if (args.placement == LOCAL_I915_CREATE_PLACEMENT_STOLEN) {
526003b705cfSriastradh		bo->purged = true; /* for asserts against CPU access */
526103b705cfSriastradh	}
526203b705cfSriastradh	bo->reusable = false; /* so that unclaimed scanouts are freed */
526303b705cfSriastradh	bo->domain = DOMAIN_NONE;
526403b705cfSriastradh
526503b705cfSriastradh	if (__kgem_busy(kgem, bo->handle)) {
52669a906b70Schristos		assert(bo->exec == NULL);
526703b705cfSriastradh		list_add(&bo->request, &kgem->flushing);
526803b705cfSriastradh		bo->rq = (void *)kgem;
52699a906b70Schristos		kgem->need_retire = true;
527003b705cfSriastradh	}
527103b705cfSriastradh
527203b705cfSriastradh	assert_tiling(kgem, bo);
527303b705cfSriastradh	debug_alloc__bo(kgem, bo);
527403b705cfSriastradh
527503b705cfSriastradh	return bo;
527603b705cfSriastradh}
527703b705cfSriastradh
52789a906b70Schristosstatic void __kgem_bo_make_scanout(struct kgem *kgem,
52799a906b70Schristos				   struct kgem_bo *bo,
52809a906b70Schristos				   int width, int height)
52819a906b70Schristos{
528263ef14f0Smrg	ScrnInfoPtr scrn = __to_sna(kgem)->scrn;
52839a906b70Schristos	struct drm_mode_fb_cmd arg;
52849a906b70Schristos
52859a906b70Schristos	assert(bo->proxy == NULL);
52869a906b70Schristos
52879a906b70Schristos	if (!scrn->vtSema)
52889a906b70Schristos		return;
52899a906b70Schristos
52909a906b70Schristos	DBG(("%s: create fb %dx%d@%d/%d\n",
52919a906b70Schristos	     __FUNCTION__, width, height, scrn->depth, scrn->bitsPerPixel));
52929a906b70Schristos
52939a906b70Schristos	VG_CLEAR(arg);
52949a906b70Schristos	arg.width = width;
52959a906b70Schristos	arg.height = height;
52969a906b70Schristos	arg.pitch = bo->pitch;
52979a906b70Schristos	arg.bpp = scrn->bitsPerPixel;
52989a906b70Schristos	arg.depth = scrn->depth;
52999a906b70Schristos	arg.handle = bo->handle;
53009a906b70Schristos
53019a906b70Schristos	/* First move the scanout out of cached memory */
53029a906b70Schristos	if (kgem->has_llc) {
53039a906b70Schristos		if (!gem_set_caching(kgem->fd, bo->handle, DISPLAY) &&
53049a906b70Schristos		    !gem_set_caching(kgem->fd, bo->handle, UNCACHED))
53059a906b70Schristos			return;
53069a906b70Schristos	}
53079a906b70Schristos
53089a906b70Schristos	bo->scanout = true;
53099a906b70Schristos
53109a906b70Schristos	/* Then pre-emptively move the object into the mappable
53119a906b70Schristos	 * portion to avoid rebinding later when busy.
53129a906b70Schristos	 */
53139a906b70Schristos	if (bo->map__gtt == NULL)
53149a906b70Schristos		bo->map__gtt = __kgem_bo_map__gtt(kgem, bo);
53159a906b70Schristos	if (bo->map__gtt) {
5316813957e3Ssnj		if (sigtrap_get() == 0) {
5317813957e3Ssnj			*(uint32_t *)bo->map__gtt = 0;
5318813957e3Ssnj			sigtrap_put();
5319813957e3Ssnj		}
53209a906b70Schristos		bo->domain = DOMAIN_GTT;
53219a906b70Schristos	}
53229a906b70Schristos
53239a906b70Schristos	if (do_ioctl(kgem->fd, DRM_IOCTL_MODE_ADDFB, &arg) == 0) {
53249a906b70Schristos		DBG(("%s: attached fb=%d to handle=%d\n",
53259a906b70Schristos		     __FUNCTION__, arg.fb_id, arg.handle));
53269a906b70Schristos		bo->delta = arg.fb_id;
53279a906b70Schristos	}
53289a906b70Schristos}
53299a906b70Schristos
533063ef14f0Smrgstatic bool tiling_changed(struct kgem_bo *bo, int tiling, int pitch)
533163ef14f0Smrg{
533263ef14f0Smrg	if (tiling != bo->tiling)
533363ef14f0Smrg		return true;
533463ef14f0Smrg
533563ef14f0Smrg	return tiling != I915_TILING_NONE && pitch != bo->pitch;
533663ef14f0Smrg}
533763ef14f0Smrg
533863ef14f0Smrgstatic void set_gpu_tiling(struct kgem *kgem,
533963ef14f0Smrg			   struct kgem_bo *bo,
534063ef14f0Smrg			   int tiling, int pitch)
534163ef14f0Smrg{
534263ef14f0Smrg	DBG(("%s: handle=%d, tiling=%d, pitch=%d\n",
534363ef14f0Smrg	     __FUNCTION__, bo->handle, tiling, pitch));
534463ef14f0Smrg
534563ef14f0Smrg	if (tiling_changed(bo, tiling, pitch) && bo->map__gtt) {
534663ef14f0Smrg		if (!list_is_empty(&bo->vma)) {
534763ef14f0Smrg			list_del(&bo->vma);
534863ef14f0Smrg			kgem->vma[0].count--;
534963ef14f0Smrg		}
535063ef14f0Smrg		munmap(bo->map__gtt, bytes(bo));
535163ef14f0Smrg		bo->map__gtt = NULL;
535263ef14f0Smrg	}
535363ef14f0Smrg
535463ef14f0Smrg	bo->tiling = tiling;
535563ef14f0Smrg	bo->pitch = pitch;
535663ef14f0Smrg}
535763ef14f0Smrg
535863ef14f0Smrgbool kgem_bo_is_fenced(struct kgem *kgem, struct kgem_bo *bo)
535963ef14f0Smrg{
536063ef14f0Smrg	struct drm_i915_gem_get_tiling tiling;
536163ef14f0Smrg
536263ef14f0Smrg	assert(kgem);
536363ef14f0Smrg	assert(bo);
536463ef14f0Smrg
536563ef14f0Smrg	VG_CLEAR(tiling);
536663ef14f0Smrg	tiling.handle = bo->handle;
536763ef14f0Smrg	tiling.tiling_mode = bo->tiling;
536863ef14f0Smrg	(void)do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_GET_TILING, &tiling);
536963ef14f0Smrg	return tiling.tiling_mode == bo->tiling; /* assume pitch is fine! */
537063ef14f0Smrg}
537163ef14f0Smrg
537203b705cfSriastradhstruct kgem_bo *kgem_create_2d(struct kgem *kgem,
537303b705cfSriastradh			       int width,
537403b705cfSriastradh			       int height,
537503b705cfSriastradh			       int bpp,
537603b705cfSriastradh			       int tiling,
537703b705cfSriastradh			       uint32_t flags)
537803b705cfSriastradh{
537903b705cfSriastradh	struct list *cache;
538003b705cfSriastradh	struct kgem_bo *bo;
538103b705cfSriastradh	uint32_t pitch, tiled_height, size;
538203b705cfSriastradh	uint32_t handle;
538303b705cfSriastradh	int i, bucket, retry;
538403b705cfSriastradh	bool exact = flags & (CREATE_EXACT | CREATE_SCANOUT);
538503b705cfSriastradh
538603b705cfSriastradh	if (tiling < 0)
538703b705cfSriastradh		exact = true, tiling = -tiling;
538803b705cfSriastradh
538903b705cfSriastradh	DBG(("%s(%dx%d, bpp=%d, tiling=%d, exact=%d, inactive=%d, cpu-mapping=%d, gtt-mapping=%d, scanout?=%d, prime?=%d, temp?=%d)\n", __FUNCTION__,
539003b705cfSriastradh	     width, height, bpp, tiling, exact,
539103b705cfSriastradh	     !!(flags & CREATE_INACTIVE),
539203b705cfSriastradh	     !!(flags & CREATE_CPU_MAP),
539303b705cfSriastradh	     !!(flags & CREATE_GTT_MAP),
539403b705cfSriastradh	     !!(flags & CREATE_SCANOUT),
539503b705cfSriastradh	     !!(flags & CREATE_PRIME),
539603b705cfSriastradh	     !!(flags & CREATE_TEMPORARY)));
539703b705cfSriastradh
539803b705cfSriastradh	size = kgem_surface_size(kgem, kgem->has_relaxed_fencing, flags,
539903b705cfSriastradh				 width, height, bpp, tiling, &pitch);
54009a906b70Schristos	if (size == 0) {
54019a906b70Schristos		DBG(("%s: invalid surface size (too large?)\n", __FUNCTION__));
54029a906b70Schristos		return NULL;
54039a906b70Schristos	}
54049a906b70Schristos
540503b705cfSriastradh	size /= PAGE_SIZE;
540603b705cfSriastradh	bucket = cache_bucket(size);
540703b705cfSriastradh
540803b705cfSriastradh	if (flags & CREATE_SCANOUT) {
540903b705cfSriastradh		struct kgem_bo *last = NULL;
541003b705cfSriastradh
541103b705cfSriastradh		list_for_each_entry_reverse(bo, &kgem->scanout, list) {
541203b705cfSriastradh			assert(bo->scanout);
541303b705cfSriastradh			assert(!bo->flush);
54149a906b70Schristos			assert(!bo->refcnt);
541503b705cfSriastradh			assert_tiling(kgem, bo);
541603b705cfSriastradh
541703b705cfSriastradh			if (size > num_pages(bo) || num_pages(bo) > 2*size)
541803b705cfSriastradh				continue;
541903b705cfSriastradh
54209a906b70Schristos			if (bo->tiling != tiling || bo->pitch != pitch)
54219a906b70Schristos				/* No tiling/pitch without recreating fb */
542203b705cfSriastradh				continue;
542303b705cfSriastradh
54249a906b70Schristos			if (bo->delta && !check_scanout_size(kgem, bo, width, height))
542563ef14f0Smrg				kgem_bo_rmfb(kgem, bo);
542603b705cfSriastradh
542703b705cfSriastradh			if (flags & CREATE_INACTIVE && bo->rq) {
542803b705cfSriastradh				last = bo;
542903b705cfSriastradh				continue;
543003b705cfSriastradh			}
543103b705cfSriastradh
543203b705cfSriastradh			list_del(&bo->list);
543303b705cfSriastradh
543403b705cfSriastradh			bo->unique_id = kgem_get_unique_id(kgem);
543503b705cfSriastradh			DBG(("  1:from scanout: pitch=%d, tiling=%d, handle=%d, id=%d\n",
543603b705cfSriastradh			     bo->pitch, bo->tiling, bo->handle, bo->unique_id));
543703b705cfSriastradh			assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo));
543803b705cfSriastradh			assert_tiling(kgem, bo);
543903b705cfSriastradh			bo->refcnt = 1;
544003b705cfSriastradh			return bo;
544103b705cfSriastradh		}
544203b705cfSriastradh
544303b705cfSriastradh		if (last) {
544403b705cfSriastradh			list_del(&last->list);
544503b705cfSriastradh
544603b705cfSriastradh			last->unique_id = kgem_get_unique_id(kgem);
544703b705cfSriastradh			DBG(("  1:from scanout: pitch=%d, tiling=%d, handle=%d, id=%d\n",
544803b705cfSriastradh			     last->pitch, last->tiling, last->handle, last->unique_id));
544903b705cfSriastradh			assert(last->pitch*kgem_aligned_height(kgem, height, last->tiling) <= kgem_bo_size(last));
545003b705cfSriastradh			assert_tiling(kgem, last);
545103b705cfSriastradh			last->refcnt = 1;
545203b705cfSriastradh			return last;
545303b705cfSriastradh		}
545403b705cfSriastradh
545563ef14f0Smrg		if (__to_sna(kgem)->scrn->vtSema) {
545663ef14f0Smrg			ScrnInfoPtr scrn = __to_sna(kgem)->scrn;
54579a906b70Schristos
54589a906b70Schristos			list_for_each_entry_reverse(bo, &kgem->scanout, list) {
54599a906b70Schristos				struct drm_mode_fb_cmd arg;
54609a906b70Schristos
54619a906b70Schristos				assert(bo->scanout);
54629a906b70Schristos				assert(!bo->refcnt);
54639a906b70Schristos
54649a906b70Schristos				if (size > num_pages(bo) || num_pages(bo) > 2*size)
54659a906b70Schristos					continue;
54669a906b70Schristos
54679a906b70Schristos				if (flags & CREATE_INACTIVE && bo->rq)
54689a906b70Schristos					continue;
54699a906b70Schristos
54709a906b70Schristos				list_del(&bo->list);
54719a906b70Schristos
54729a906b70Schristos				if (bo->tiling != tiling || bo->pitch != pitch) {
54739a906b70Schristos					if (bo->delta) {
54749a906b70Schristos						kgem_bo_rmfb(kgem, bo);
54759a906b70Schristos						bo->delta = 0;
54769a906b70Schristos					}
54779a906b70Schristos
547863ef14f0Smrg					if (!kgem_set_tiling(kgem, bo,
547963ef14f0Smrg							     tiling, pitch)) {
548063ef14f0Smrg						bo->scanout = false;
548163ef14f0Smrg						__kgem_bo_destroy(kgem, bo);
54829a906b70Schristos						break;
54839a906b70Schristos					}
54849a906b70Schristos				}
54859a906b70Schristos
54869a906b70Schristos				VG_CLEAR(arg);
54879a906b70Schristos				arg.width = width;
54889a906b70Schristos				arg.height = height;
54899a906b70Schristos				arg.pitch = bo->pitch;
54909a906b70Schristos				arg.bpp = scrn->bitsPerPixel;
54919a906b70Schristos				arg.depth = scrn->depth;
54929a906b70Schristos				arg.handle = bo->handle;
54939a906b70Schristos
54949a906b70Schristos				if (do_ioctl(kgem->fd, DRM_IOCTL_MODE_ADDFB, &arg)) {
549563ef14f0Smrg					bo->scanout = false;
549663ef14f0Smrg					__kgem_bo_destroy(kgem, bo);
54979a906b70Schristos					break;
54989a906b70Schristos				}
54999a906b70Schristos
55009a906b70Schristos				bo->delta = arg.fb_id;
55019a906b70Schristos				bo->unique_id = kgem_get_unique_id(kgem);
55029a906b70Schristos
55039a906b70Schristos				DBG(("  2:from scanout: pitch=%d, tiling=%d, handle=%d, id=%d\n",
55049a906b70Schristos				     bo->pitch, bo->tiling, bo->handle, bo->unique_id));
55059a906b70Schristos				assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo));
55069a906b70Schristos				assert_tiling(kgem, bo);
55079a906b70Schristos				bo->refcnt = 1;
55089a906b70Schristos				return bo;
55099a906b70Schristos			}
55109a906b70Schristos		}
55119a906b70Schristos
551263ef14f0Smrg		if (flags & CREATE_CACHED)
551363ef14f0Smrg			return NULL;
551463ef14f0Smrg
551503b705cfSriastradh		bo = __kgem_bo_create_as_display(kgem, size, tiling, pitch);
551603b705cfSriastradh		if (bo)
551703b705cfSriastradh			return bo;
55189a906b70Schristos
55199a906b70Schristos		flags |= CREATE_INACTIVE;
552003b705cfSriastradh	}
552103b705cfSriastradh
552203b705cfSriastradh	if (bucket >= NUM_CACHE_BUCKETS) {
552303b705cfSriastradh		DBG(("%s: large bo num pages=%d, bucket=%d\n",
552403b705cfSriastradh		     __FUNCTION__, size, bucket));
552503b705cfSriastradh
552603b705cfSriastradh		if (flags & CREATE_INACTIVE)
552703b705cfSriastradh			goto large_inactive;
552803b705cfSriastradh
552903b705cfSriastradh		tiled_height = kgem_aligned_height(kgem, height, tiling);
553003b705cfSriastradh
553103b705cfSriastradh		list_for_each_entry(bo, &kgem->large, list) {
553203b705cfSriastradh			assert(!bo->purged);
553303b705cfSriastradh			assert(!bo->scanout);
553403b705cfSriastradh			assert(bo->refcnt == 0);
553503b705cfSriastradh			assert(bo->reusable);
553603b705cfSriastradh			assert_tiling(kgem, bo);
553703b705cfSriastradh
553803b705cfSriastradh			if (kgem->gen < 040) {
553903b705cfSriastradh				if (bo->pitch < pitch) {
554003b705cfSriastradh					DBG(("tiled and pitch too small: tiling=%d, (want %d), pitch=%d, need %d\n",
554103b705cfSriastradh					     bo->tiling, tiling,
554203b705cfSriastradh					     bo->pitch, pitch));
554303b705cfSriastradh					continue;
554403b705cfSriastradh				}
554503b705cfSriastradh
554603b705cfSriastradh				if (bo->pitch * tiled_height > bytes(bo))
554703b705cfSriastradh					continue;
554803b705cfSriastradh			} else {
554903b705cfSriastradh				if (num_pages(bo) < size)
555003b705cfSriastradh					continue;
555103b705cfSriastradh
555263ef14f0Smrg				if (!kgem_set_tiling(kgem, bo, tiling, pitch)) {
555363ef14f0Smrg					if (exact) {
555463ef14f0Smrg						DBG(("tiled and pitch not exact: tiling=%d, (want %d), pitch=%d, need %d\n",
555563ef14f0Smrg						     bo->tiling, tiling,
555663ef14f0Smrg						     bo->pitch, pitch));
555703b705cfSriastradh						continue;
555863ef14f0Smrg					}
555903b705cfSriastradh
556063ef14f0Smrg					set_gpu_tiling(kgem, bo, tiling, pitch);
556103b705cfSriastradh				}
556203b705cfSriastradh			}
556303b705cfSriastradh
556403b705cfSriastradh			kgem_bo_remove_from_active(kgem, bo);
556503b705cfSriastradh
556603b705cfSriastradh			bo->unique_id = kgem_get_unique_id(kgem);
556703b705cfSriastradh			bo->delta = 0;
556803b705cfSriastradh			DBG(("  1:from active: pitch=%d, tiling=%d, handle=%d, id=%d\n",
556903b705cfSriastradh			     bo->pitch, bo->tiling, bo->handle, bo->unique_id));
557003b705cfSriastradh			assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo));
557103b705cfSriastradh			assert_tiling(kgem, bo);
557203b705cfSriastradh			bo->refcnt = 1;
557303b705cfSriastradh			return bo;
557403b705cfSriastradh		}
557503b705cfSriastradh
557603b705cfSriastradhlarge_inactive:
557703b705cfSriastradh		__kgem_throttle_retire(kgem, flags);
557803b705cfSriastradh		list_for_each_entry(bo, &kgem->large_inactive, list) {
557903b705cfSriastradh			assert(bo->refcnt == 0);
558003b705cfSriastradh			assert(bo->reusable);
558103b705cfSriastradh			assert(!bo->scanout);
558203b705cfSriastradh			assert_tiling(kgem, bo);
558303b705cfSriastradh
558403b705cfSriastradh			if (size > num_pages(bo))
558503b705cfSriastradh				continue;
558603b705cfSriastradh
558763ef14f0Smrg			if (!kgem_set_tiling(kgem, bo, tiling, pitch)) {
558863ef14f0Smrg				if (kgem->gen >= 040 && !exact)
558963ef14f0Smrg					set_gpu_tiling(kgem, bo, tiling, pitch);
559063ef14f0Smrg				else
559103b705cfSriastradh					continue;
559203b705cfSriastradh			}
559303b705cfSriastradh
559403b705cfSriastradh			if (bo->purged && !kgem_bo_clear_purgeable(kgem, bo)) {
559503b705cfSriastradh				kgem_bo_free(kgem, bo);
559603b705cfSriastradh				break;
559703b705cfSriastradh			}
559803b705cfSriastradh
559903b705cfSriastradh			list_del(&bo->list);
560003b705cfSriastradh
560103b705cfSriastradh			assert(bo->domain != DOMAIN_GPU);
560203b705cfSriastradh			bo->unique_id = kgem_get_unique_id(kgem);
560303b705cfSriastradh			bo->delta = 0;
560403b705cfSriastradh			DBG(("  1:from large inactive: pitch=%d, tiling=%d, handle=%d, id=%d\n",
560503b705cfSriastradh			     bo->pitch, bo->tiling, bo->handle, bo->unique_id));
560603b705cfSriastradh			assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo));
560703b705cfSriastradh			assert_tiling(kgem, bo);
560803b705cfSriastradh			bo->refcnt = 1;
56099a906b70Schristos
56109a906b70Schristos			if (flags & CREATE_SCANOUT)
56119a906b70Schristos				__kgem_bo_make_scanout(kgem, bo, width, height);
56129a906b70Schristos
561303b705cfSriastradh			return bo;
561403b705cfSriastradh		}
561503b705cfSriastradh
561603b705cfSriastradh		goto create;
561703b705cfSriastradh	}
561803b705cfSriastradh
561903b705cfSriastradh	if (flags & (CREATE_CPU_MAP | CREATE_GTT_MAP)) {
562003b705cfSriastradh		int for_cpu = !!(flags & CREATE_CPU_MAP);
562103b705cfSriastradh		if (kgem->has_llc && tiling == I915_TILING_NONE)
562203b705cfSriastradh			for_cpu = 1;
562303b705cfSriastradh		/* We presume that we will need to upload to this bo,
562403b705cfSriastradh		 * and so would prefer to have an active VMA.
562503b705cfSriastradh		 */
562603b705cfSriastradh		cache = &kgem->vma[for_cpu].inactive[bucket];
562703b705cfSriastradh		do {
562803b705cfSriastradh			list_for_each_entry(bo, cache, vma) {
562903b705cfSriastradh				assert(bucket(bo) == bucket);
563003b705cfSriastradh				assert(bo->refcnt == 0);
563103b705cfSriastradh				assert(!bo->scanout);
5632813957e3Ssnj				assert(for_cpu ? !!bo->map__cpu : (bo->map__gtt || bo->map__wc));
563303b705cfSriastradh				assert(bo->rq == NULL);
56349a906b70Schristos				assert(bo->exec == NULL);
563503b705cfSriastradh				assert(list_is_empty(&bo->request));
563603b705cfSriastradh				assert(bo->flush == false);
563703b705cfSriastradh				assert_tiling(kgem, bo);
563803b705cfSriastradh
563903b705cfSriastradh				if (size > num_pages(bo)) {
564003b705cfSriastradh					DBG(("inactive too small: %d < %d\n",
564103b705cfSriastradh					     num_pages(bo), size));
564203b705cfSriastradh					continue;
564303b705cfSriastradh				}
564403b705cfSriastradh
56459a906b70Schristos				if (flags & UNCACHED && !kgem->has_llc && bo->domain != DOMAIN_CPU)
56469a906b70Schristos					continue;
56479a906b70Schristos
564803b705cfSriastradh				if (bo->tiling != tiling ||
564903b705cfSriastradh				    (tiling != I915_TILING_NONE && bo->pitch != pitch)) {
56509a906b70Schristos					if (bo->map__gtt ||
565163ef14f0Smrg					    !kgem_set_tiling(kgem, bo,
565263ef14f0Smrg							     tiling, pitch)) {
56539a906b70Schristos						DBG(("inactive GTT vma with wrong tiling: %d < %d\n",
56549a906b70Schristos						     bo->tiling, tiling));
565563ef14f0Smrg						kgem_bo_free(kgem, bo);
565663ef14f0Smrg						break;
56579a906b70Schristos					}
565803b705cfSriastradh				}
565903b705cfSriastradh
566003b705cfSriastradh				if (bo->purged && !kgem_bo_clear_purgeable(kgem, bo)) {
566103b705cfSriastradh					kgem_bo_free(kgem, bo);
566203b705cfSriastradh					break;
566303b705cfSriastradh				}
566403b705cfSriastradh
566563ef14f0Smrg				if (tiling == I915_TILING_NONE)
566663ef14f0Smrg					bo->pitch = pitch;
566763ef14f0Smrg
566803b705cfSriastradh				assert(bo->tiling == tiling);
566963ef14f0Smrg				assert(bo->pitch >= pitch);
567003b705cfSriastradh				bo->delta = 0;
567103b705cfSriastradh				bo->unique_id = kgem_get_unique_id(kgem);
567203b705cfSriastradh
567303b705cfSriastradh				kgem_bo_remove_from_inactive(kgem, bo);
56749a906b70Schristos				assert(list_is_empty(&bo->list));
56759a906b70Schristos				assert(list_is_empty(&bo->vma));
567603b705cfSriastradh
567703b705cfSriastradh				DBG(("  from inactive vma: pitch=%d, tiling=%d: handle=%d, id=%d\n",
567803b705cfSriastradh				     bo->pitch, bo->tiling, bo->handle, bo->unique_id));
567903b705cfSriastradh				assert(bo->reusable);
568003b705cfSriastradh				assert(bo->domain != DOMAIN_GPU);
568103b705cfSriastradh				ASSERT_IDLE(kgem, bo->handle);
568203b705cfSriastradh				assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo));
568303b705cfSriastradh				assert_tiling(kgem, bo);
568403b705cfSriastradh				bo->refcnt = 1;
568503b705cfSriastradh				return bo;
568603b705cfSriastradh			}
568703b705cfSriastradh		} while (!list_is_empty(cache) &&
568803b705cfSriastradh			 __kgem_throttle_retire(kgem, flags));
568903b705cfSriastradh
569003b705cfSriastradh		if (flags & CREATE_CPU_MAP && !kgem->has_llc) {
569103b705cfSriastradh			if (list_is_empty(&kgem->active[bucket][tiling]) &&
569203b705cfSriastradh			    list_is_empty(&kgem->inactive[bucket]))
569303b705cfSriastradh				flags &= ~CREATE_CACHED;
569403b705cfSriastradh
569503b705cfSriastradh			goto create;
569603b705cfSriastradh		}
569703b705cfSriastradh	}
569803b705cfSriastradh
569903b705cfSriastradh	if (flags & CREATE_INACTIVE)
570003b705cfSriastradh		goto skip_active_search;
570103b705cfSriastradh
570203b705cfSriastradh	/* Best active match */
570303b705cfSriastradh	retry = NUM_CACHE_BUCKETS - bucket;
570403b705cfSriastradh	if (retry > 3 && (flags & CREATE_TEMPORARY) == 0)
570503b705cfSriastradh		retry = 3;
57069a906b70Schristossearch_active:
570703b705cfSriastradh	assert(bucket < NUM_CACHE_BUCKETS);
570803b705cfSriastradh	cache = &kgem->active[bucket][tiling];
570903b705cfSriastradh	if (tiling) {
571003b705cfSriastradh		tiled_height = kgem_aligned_height(kgem, height, tiling);
571103b705cfSriastradh		list_for_each_entry(bo, cache, list) {
571203b705cfSriastradh			assert(!bo->purged);
571303b705cfSriastradh			assert(bo->refcnt == 0);
571403b705cfSriastradh			assert(bucket(bo) == bucket);
571503b705cfSriastradh			assert(bo->reusable);
571603b705cfSriastradh			assert(bo->tiling == tiling);
571703b705cfSriastradh			assert(bo->flush == false);
571803b705cfSriastradh			assert(!bo->scanout);
571903b705cfSriastradh			assert_tiling(kgem, bo);
572003b705cfSriastradh
572103b705cfSriastradh			if (kgem->gen < 040) {
572203b705cfSriastradh				if (bo->pitch < pitch) {
572303b705cfSriastradh					DBG(("tiled and pitch too small: tiling=%d, (want %d), pitch=%d, need %d\n",
572403b705cfSriastradh					     bo->tiling, tiling,
572503b705cfSriastradh					     bo->pitch, pitch));
572603b705cfSriastradh					continue;
572703b705cfSriastradh				}
572803b705cfSriastradh
572903b705cfSriastradh				if (bo->pitch * tiled_height > bytes(bo))
573003b705cfSriastradh					continue;
573103b705cfSriastradh			} else {
573203b705cfSriastradh				if (num_pages(bo) < size)
573303b705cfSriastradh					continue;
573403b705cfSriastradh
573563ef14f0Smrg				if (!kgem_set_tiling(kgem, bo, tiling, pitch)) {
573663ef14f0Smrg					if (exact) {
573763ef14f0Smrg						DBG(("tiled and pitch not exact: tiling=%d, (want %d), pitch=%d, need %d\n",
573863ef14f0Smrg						     bo->tiling, tiling,
573963ef14f0Smrg						     bo->pitch, pitch));
574003b705cfSriastradh						continue;
574163ef14f0Smrg					}
574203b705cfSriastradh
574363ef14f0Smrg					set_gpu_tiling(kgem, bo, tiling, pitch);
574403b705cfSriastradh				}
574503b705cfSriastradh			}
574663ef14f0Smrg			assert(bo->tiling == tiling);
574763ef14f0Smrg			assert(bo->pitch >= pitch);
574803b705cfSriastradh
574903b705cfSriastradh			kgem_bo_remove_from_active(kgem, bo);
575003b705cfSriastradh
575103b705cfSriastradh			bo->unique_id = kgem_get_unique_id(kgem);
575203b705cfSriastradh			bo->delta = 0;
575303b705cfSriastradh			DBG(("  1:from active: pitch=%d, tiling=%d, handle=%d, id=%d\n",
575403b705cfSriastradh			     bo->pitch, bo->tiling, bo->handle, bo->unique_id));
575503b705cfSriastradh			assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo));
575603b705cfSriastradh			assert_tiling(kgem, bo);
575703b705cfSriastradh			bo->refcnt = 1;
575803b705cfSriastradh			return bo;
575903b705cfSriastradh		}
576003b705cfSriastradh	} else {
576103b705cfSriastradh		list_for_each_entry(bo, cache, list) {
576203b705cfSriastradh			assert(bucket(bo) == bucket);
576303b705cfSriastradh			assert(!bo->purged);
576403b705cfSriastradh			assert(bo->refcnt == 0);
576503b705cfSriastradh			assert(bo->reusable);
576603b705cfSriastradh			assert(!bo->scanout);
576703b705cfSriastradh			assert(bo->tiling == tiling);
576803b705cfSriastradh			assert(bo->flush == false);
576903b705cfSriastradh			assert_tiling(kgem, bo);
577003b705cfSriastradh
577103b705cfSriastradh			if (num_pages(bo) < size)
577203b705cfSriastradh				continue;
577303b705cfSriastradh
577403b705cfSriastradh			kgem_bo_remove_from_active(kgem, bo);
577503b705cfSriastradh
577603b705cfSriastradh			bo->pitch = pitch;
577703b705cfSriastradh			bo->unique_id = kgem_get_unique_id(kgem);
577803b705cfSriastradh			bo->delta = 0;
577903b705cfSriastradh			DBG(("  1:from active: pitch=%d, tiling=%d, handle=%d, id=%d\n",
578003b705cfSriastradh			     bo->pitch, bo->tiling, bo->handle, bo->unique_id));
578103b705cfSriastradh			assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo));
578203b705cfSriastradh			assert_tiling(kgem, bo);
578303b705cfSriastradh			bo->refcnt = 1;
578403b705cfSriastradh			return bo;
578503b705cfSriastradh		}
578603b705cfSriastradh	}
578703b705cfSriastradh
57889a906b70Schristos	if (kgem->gen >= 040) {
57899a906b70Schristos		for (i = I915_TILING_Y; i >= I915_TILING_NONE; i--) {
57909a906b70Schristos			cache = &kgem->active[bucket][i];
57919a906b70Schristos			list_for_each_entry(bo, cache, list) {
57929a906b70Schristos				assert(!bo->purged);
57939a906b70Schristos				assert(bo->refcnt == 0);
57949a906b70Schristos				assert(bo->reusable);
57959a906b70Schristos				assert(!bo->scanout);
57969a906b70Schristos				assert(bo->flush == false);
57979a906b70Schristos				assert_tiling(kgem, bo);
579803b705cfSriastradh
57999a906b70Schristos				if (num_pages(bo) < size)
58009a906b70Schristos					continue;
580103b705cfSriastradh
580263ef14f0Smrg				if (!kgem_set_tiling(kgem, bo, tiling, pitch)) {
580363ef14f0Smrg					if (exact || kgem->gen < 040)
580403b705cfSriastradh						continue;
580563ef14f0Smrg
580663ef14f0Smrg					set_gpu_tiling(kgem, bo, tiling, pitch);
58079a906b70Schristos				}
580863ef14f0Smrg				assert(bo->tiling == tiling);
580963ef14f0Smrg				assert(bo->pitch >= pitch);
581003b705cfSriastradh
58119a906b70Schristos				kgem_bo_remove_from_active(kgem, bo);
581203b705cfSriastradh
58139a906b70Schristos				bo->unique_id = kgem_get_unique_id(kgem);
58149a906b70Schristos				bo->delta = 0;
58159a906b70Schristos				DBG(("  1:from active: pitch=%d, tiling=%d, handle=%d, id=%d\n",
58169a906b70Schristos				     bo->pitch, bo->tiling, bo->handle, bo->unique_id));
58179a906b70Schristos				assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo));
58189a906b70Schristos				assert_tiling(kgem, bo);
58199a906b70Schristos				bo->refcnt = 1;
58209a906b70Schristos				return bo;
582103b705cfSriastradh			}
582203b705cfSriastradh		}
58239a906b70Schristos	} else if (!exact) { /* allow an active near-miss? */
58249a906b70Schristos		for (i = tiling; i >= I915_TILING_NONE; i--) {
582503b705cfSriastradh			tiled_height = kgem_surface_size(kgem, kgem->has_relaxed_fencing, flags,
582603b705cfSriastradh							 width, height, bpp, tiling, &pitch);
582703b705cfSriastradh			cache = active(kgem, tiled_height / PAGE_SIZE, i);
582803b705cfSriastradh			tiled_height = kgem_aligned_height(kgem, height, i);
582903b705cfSriastradh			list_for_each_entry(bo, cache, list) {
583003b705cfSriastradh				assert(!bo->purged);
583103b705cfSriastradh				assert(bo->refcnt == 0);
583203b705cfSriastradh				assert(bo->reusable);
583303b705cfSriastradh				assert(!bo->scanout);
583403b705cfSriastradh				assert(bo->flush == false);
583503b705cfSriastradh				assert_tiling(kgem, bo);
583603b705cfSriastradh
583703b705cfSriastradh				if (bo->tiling) {
583803b705cfSriastradh					if (bo->pitch < pitch) {
583903b705cfSriastradh						DBG(("tiled and pitch too small: tiling=%d, (want %d), pitch=%d, need %d\n",
584003b705cfSriastradh						     bo->tiling, tiling,
584103b705cfSriastradh						     bo->pitch, pitch));
584203b705cfSriastradh						continue;
584303b705cfSriastradh					}
584403b705cfSriastradh				} else
584503b705cfSriastradh					bo->pitch = pitch;
584603b705cfSriastradh
584703b705cfSriastradh				if (bo->pitch * tiled_height > bytes(bo))
584803b705cfSriastradh					continue;
584903b705cfSriastradh
585003b705cfSriastradh				kgem_bo_remove_from_active(kgem, bo);
585103b705cfSriastradh
585203b705cfSriastradh				bo->unique_id = kgem_get_unique_id(kgem);
585303b705cfSriastradh				bo->delta = 0;
585403b705cfSriastradh				DBG(("  1:from active: pitch=%d, tiling=%d, handle=%d, id=%d\n",
585503b705cfSriastradh				     bo->pitch, bo->tiling, bo->handle, bo->unique_id));
585603b705cfSriastradh				assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo));
585703b705cfSriastradh				assert_tiling(kgem, bo);
585803b705cfSriastradh				bo->refcnt = 1;
585903b705cfSriastradh				return bo;
586003b705cfSriastradh			}
586103b705cfSriastradh		}
586203b705cfSriastradh	}
586303b705cfSriastradh
58649a906b70Schristos	if (--retry) {
58659a906b70Schristos		bucket++;
58669a906b70Schristos		goto search_active;
58679a906b70Schristos	}
58689a906b70Schristos
586903b705cfSriastradhskip_active_search:
587003b705cfSriastradh	bucket = cache_bucket(size);
587103b705cfSriastradh	retry = NUM_CACHE_BUCKETS - bucket;
587203b705cfSriastradh	if (retry > 3)
587303b705cfSriastradh		retry = 3;
587403b705cfSriastradhsearch_inactive:
587503b705cfSriastradh	/* Now just look for a close match and prefer any currently active */
587603b705cfSriastradh	assert(bucket < NUM_CACHE_BUCKETS);
587703b705cfSriastradh	cache = &kgem->inactive[bucket];
587803b705cfSriastradh	list_for_each_entry(bo, cache, list) {
587903b705cfSriastradh		assert(bucket(bo) == bucket);
588003b705cfSriastradh		assert(bo->reusable);
588103b705cfSriastradh		assert(!bo->scanout);
588203b705cfSriastradh		assert(bo->flush == false);
588303b705cfSriastradh		assert_tiling(kgem, bo);
588403b705cfSriastradh
588503b705cfSriastradh		if (size > num_pages(bo)) {
588603b705cfSriastradh			DBG(("inactive too small: %d < %d\n",
588703b705cfSriastradh			     num_pages(bo), size));
588803b705cfSriastradh			continue;
588903b705cfSriastradh		}
589003b705cfSriastradh
589163ef14f0Smrg		if (!kgem_set_tiling(kgem, bo, tiling, pitch)) {
589263ef14f0Smrg			if (exact || kgem->gen < 040) {
589363ef14f0Smrg				kgem_bo_free(kgem, bo);
589463ef14f0Smrg				break;
589563ef14f0Smrg			}
589663ef14f0Smrg
589763ef14f0Smrg			set_gpu_tiling(kgem, bo, tiling, pitch);
589803b705cfSriastradh		}
589903b705cfSriastradh
590003b705cfSriastradh		if (bo->purged && !kgem_bo_clear_purgeable(kgem, bo)) {
590103b705cfSriastradh			kgem_bo_free(kgem, bo);
590203b705cfSriastradh			break;
590303b705cfSriastradh		}
590403b705cfSriastradh
590503b705cfSriastradh		kgem_bo_remove_from_inactive(kgem, bo);
59069a906b70Schristos		assert(list_is_empty(&bo->list));
59079a906b70Schristos		assert(list_is_empty(&bo->vma));
590863ef14f0Smrg		assert(bo->tiling == tiling);
590963ef14f0Smrg		assert(bo->pitch >= pitch);
591003b705cfSriastradh
591103b705cfSriastradh		bo->delta = 0;
591203b705cfSriastradh		bo->unique_id = kgem_get_unique_id(kgem);
591303b705cfSriastradh		assert(bo->pitch);
591403b705cfSriastradh		DBG(("  from inactive: pitch=%d, tiling=%d: handle=%d, id=%d\n",
591503b705cfSriastradh		     bo->pitch, bo->tiling, bo->handle, bo->unique_id));
591603b705cfSriastradh		assert(bo->refcnt == 0);
591703b705cfSriastradh		assert(bo->reusable);
591803b705cfSriastradh		assert((flags & CREATE_INACTIVE) == 0 || bo->domain != DOMAIN_GPU);
591903b705cfSriastradh		ASSERT_MAYBE_IDLE(kgem, bo->handle, flags & CREATE_INACTIVE);
592003b705cfSriastradh		assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo));
592103b705cfSriastradh		assert_tiling(kgem, bo);
592203b705cfSriastradh		bo->refcnt = 1;
59239a906b70Schristos
59249a906b70Schristos		if (flags & CREATE_SCANOUT)
59259a906b70Schristos			__kgem_bo_make_scanout(kgem, bo, width, height);
59269a906b70Schristos
592703b705cfSriastradh		return bo;
592803b705cfSriastradh	}
592903b705cfSriastradh
59309a906b70Schristos	if ((flags & CREATE_NO_RETIRE) == 0) {
59319a906b70Schristos		list_for_each_entry_reverse(bo, &kgem->active[bucket][tiling], list) {
59329a906b70Schristos			if (bo->exec)
59339a906b70Schristos				break;
59349a906b70Schristos
59359a906b70Schristos			if (size > num_pages(bo))
59369a906b70Schristos				continue;
59379a906b70Schristos
59389a906b70Schristos			if (__kgem_busy(kgem, bo->handle)) {
59399a906b70Schristos				if (flags & CREATE_NO_THROTTLE)
59409a906b70Schristos					goto no_retire;
59419a906b70Schristos
59429a906b70Schristos				do {
59439a906b70Schristos					if (!kgem->need_throttle) {
59449a906b70Schristos						DBG(("%s: not throttling for active handle=%d\n", __FUNCTION__, bo->handle));
59459a906b70Schristos						goto no_retire;
59469a906b70Schristos					}
59479a906b70Schristos
59489a906b70Schristos					__kgem_throttle(kgem, false);
59499a906b70Schristos				} while (__kgem_busy(kgem, bo->handle));
59509a906b70Schristos			}
59519a906b70Schristos
59529a906b70Schristos			DBG(("%s: flushed active handle=%d\n", __FUNCTION__, bo->handle));
59539a906b70Schristos
59549a906b70Schristos			kgem_bo_remove_from_active(kgem, bo);
59559a906b70Schristos			__kgem_bo_clear_busy(bo);
59569a906b70Schristos
595763ef14f0Smrg			if (!kgem_set_tiling(kgem, bo, tiling, pitch)) {
595863ef14f0Smrg				if (exact || kgem->gen < 040)
59599a906b70Schristos					goto no_retire;
596063ef14f0Smrg
596163ef14f0Smrg				set_gpu_tiling(kgem, bo, tiling, pitch);
59629a906b70Schristos			}
596363ef14f0Smrg			assert(bo->tiling == tiling);
596463ef14f0Smrg			assert(bo->pitch >= pitch);
59659a906b70Schristos
59669a906b70Schristos			bo->unique_id = kgem_get_unique_id(kgem);
59679a906b70Schristos			bo->delta = 0;
59689a906b70Schristos			DBG(("  2:from active: pitch=%d, tiling=%d, handle=%d, id=%d\n",
59699a906b70Schristos			     bo->pitch, bo->tiling, bo->handle, bo->unique_id));
59709a906b70Schristos			assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo));
59719a906b70Schristos			assert_tiling(kgem, bo);
59729a906b70Schristos			bo->refcnt = 1;
59739a906b70Schristos
59749a906b70Schristos			if (flags & CREATE_SCANOUT)
59759a906b70Schristos				__kgem_bo_make_scanout(kgem, bo, width, height);
59769a906b70Schristos
59779a906b70Schristos			return bo;
59789a906b70Schristos		}
59799a906b70Schristosno_retire:
59809a906b70Schristos		flags |= CREATE_NO_RETIRE;
598103b705cfSriastradh	}
598203b705cfSriastradh
598303b705cfSriastradh	if (--retry) {
598403b705cfSriastradh		bucket++;
598503b705cfSriastradh		goto search_inactive;
598603b705cfSriastradh	}
598703b705cfSriastradh
598803b705cfSriastradhcreate:
59899a906b70Schristos	if (flags & CREATE_CACHED) {
59909a906b70Schristos		DBG(("%s: no cached bo found, requested not to create a new bo\n", __FUNCTION__));
599103b705cfSriastradh		return NULL;
59929a906b70Schristos	}
599303b705cfSriastradh
599403b705cfSriastradh	if (bucket >= NUM_CACHE_BUCKETS)
599503b705cfSriastradh		size = ALIGN(size, 1024);
599603b705cfSriastradh	handle = gem_create(kgem->fd, size);
59979a906b70Schristos	if (handle == 0) {
59989a906b70Schristos		DBG(("%s: kernel allocation (gem_create) failure\n", __FUNCTION__));
599903b705cfSriastradh		return NULL;
60009a906b70Schristos	}
600103b705cfSriastradh
600203b705cfSriastradh	bo = __kgem_bo_alloc(handle, size);
600303b705cfSriastradh	if (!bo) {
60049a906b70Schristos		DBG(("%s: malloc failed\n", __FUNCTION__));
600503b705cfSriastradh		gem_close(kgem->fd, handle);
600603b705cfSriastradh		return NULL;
600703b705cfSriastradh	}
600803b705cfSriastradh
600903b705cfSriastradh	bo->unique_id = kgem_get_unique_id(kgem);
601063ef14f0Smrg	if (kgem_set_tiling(kgem, bo, tiling, pitch)) {
60119a906b70Schristos		if (flags & CREATE_SCANOUT)
60129a906b70Schristos			__kgem_bo_make_scanout(kgem, bo, width, height);
601303b705cfSriastradh	} else {
601463ef14f0Smrg		if (kgem->gen >= 040) {
601563ef14f0Smrg			assert(!kgem->can_fence);
601663ef14f0Smrg			bo->tiling = tiling;
601763ef14f0Smrg			bo->pitch = pitch;
601863ef14f0Smrg		} else {
601963ef14f0Smrg			if (flags & CREATE_EXACT) {
602063ef14f0Smrg				DBG(("%s: failed to set exact tiling (gem_set_tiling)\n", __FUNCTION__));
602163ef14f0Smrg				gem_close(kgem->fd, handle);
602263ef14f0Smrg				free(bo);
602363ef14f0Smrg				return NULL;
602463ef14f0Smrg			}
602503b705cfSriastradh		}
602603b705cfSriastradh	}
602703b705cfSriastradh
602803b705cfSriastradh	assert(bytes(bo) >= bo->pitch * kgem_aligned_height(kgem, height, bo->tiling));
602903b705cfSriastradh	assert_tiling(kgem, bo);
603003b705cfSriastradh
603103b705cfSriastradh	debug_alloc__bo(kgem, bo);
603203b705cfSriastradh
603303b705cfSriastradh	DBG(("  new pitch=%d, tiling=%d, handle=%d, id=%d, num_pages=%d [%d], bucket=%d\n",
603403b705cfSriastradh	     bo->pitch, bo->tiling, bo->handle, bo->unique_id,
603503b705cfSriastradh	     size, num_pages(bo), bucket(bo)));
603603b705cfSriastradh	return bo;
603703b705cfSriastradh}
603803b705cfSriastradh
603903b705cfSriastradhstruct kgem_bo *kgem_create_cpu_2d(struct kgem *kgem,
604003b705cfSriastradh				   int width,
604103b705cfSriastradh				   int height,
604203b705cfSriastradh				   int bpp,
604303b705cfSriastradh				   uint32_t flags)
604403b705cfSriastradh{
604503b705cfSriastradh	struct kgem_bo *bo;
604603b705cfSriastradh	int stride, size;
604703b705cfSriastradh
604803b705cfSriastradh	if (DBG_NO_CPU)
604903b705cfSriastradh		return NULL;
605003b705cfSriastradh
605103b705cfSriastradh	DBG(("%s(%dx%d, bpp=%d)\n", __FUNCTION__, width, height, bpp));
605203b705cfSriastradh
605303b705cfSriastradh	if (kgem->has_llc) {
605403b705cfSriastradh		bo = kgem_create_2d(kgem, width, height, bpp,
605503b705cfSriastradh				    I915_TILING_NONE, flags);
605603b705cfSriastradh		if (bo == NULL)
605703b705cfSriastradh			return bo;
605803b705cfSriastradh
605903b705cfSriastradh		assert(bo->tiling == I915_TILING_NONE);
606003b705cfSriastradh		assert_tiling(kgem, bo);
606103b705cfSriastradh
606203b705cfSriastradh		if (kgem_bo_map__cpu(kgem, bo) == NULL) {
606303b705cfSriastradh			kgem_bo_destroy(kgem, bo);
606403b705cfSriastradh			return NULL;
606503b705cfSriastradh		}
606603b705cfSriastradh
606703b705cfSriastradh		return bo;
606803b705cfSriastradh	}
606903b705cfSriastradh
607003b705cfSriastradh	assert(width > 0 && height > 0);
607103b705cfSriastradh	stride = ALIGN(width, 2) * bpp >> 3;
607203b705cfSriastradh	stride = ALIGN(stride, 4);
607303b705cfSriastradh	size = stride * ALIGN(height, 2);
607403b705cfSriastradh	assert(size >= PAGE_SIZE);
607503b705cfSriastradh
607603b705cfSriastradh	DBG(("%s: %dx%d, %d bpp, stride=%d\n",
607703b705cfSriastradh	     __FUNCTION__, width, height, bpp, stride));
607803b705cfSriastradh
607903b705cfSriastradh	bo = search_snoop_cache(kgem, NUM_PAGES(size), 0);
608003b705cfSriastradh	if (bo) {
608103b705cfSriastradh		assert(bo->tiling == I915_TILING_NONE);
608203b705cfSriastradh		assert_tiling(kgem, bo);
608303b705cfSriastradh		assert(bo->snoop);
608403b705cfSriastradh		bo->refcnt = 1;
608503b705cfSriastradh		bo->pitch = stride;
608603b705cfSriastradh		bo->unique_id = kgem_get_unique_id(kgem);
608703b705cfSriastradh		return bo;
608803b705cfSriastradh	}
608903b705cfSriastradh
609003b705cfSriastradh	if (kgem->has_caching) {
609103b705cfSriastradh		bo = kgem_create_linear(kgem, size, flags);
609203b705cfSriastradh		if (bo == NULL)
609303b705cfSriastradh			return NULL;
609403b705cfSriastradh
609503b705cfSriastradh		assert(bo->tiling == I915_TILING_NONE);
609603b705cfSriastradh		assert_tiling(kgem, bo);
609703b705cfSriastradh
6098813957e3Ssnj		assert(!__kgem_busy(kgem, bo->handle));
609903b705cfSriastradh		if (!gem_set_caching(kgem->fd, bo->handle, SNOOPED)) {
610003b705cfSriastradh			kgem_bo_destroy(kgem, bo);
610103b705cfSriastradh			return NULL;
610203b705cfSriastradh		}
610303b705cfSriastradh		bo->snoop = true;
610403b705cfSriastradh
610503b705cfSriastradh		if (kgem_bo_map__cpu(kgem, bo) == NULL) {
610603b705cfSriastradh			kgem_bo_destroy(kgem, bo);
610703b705cfSriastradh			return NULL;
610803b705cfSriastradh		}
610903b705cfSriastradh
611003b705cfSriastradh		bo->pitch = stride;
611103b705cfSriastradh		bo->unique_id = kgem_get_unique_id(kgem);
611203b705cfSriastradh		return bo;
611303b705cfSriastradh	}
611403b705cfSriastradh
611503b705cfSriastradh	if (kgem->has_userptr) {
611603b705cfSriastradh		void *ptr;
611703b705cfSriastradh
611803b705cfSriastradh		/* XXX */
611903b705cfSriastradh		//if (posix_memalign(&ptr, 64, ALIGN(size, 64)))
612003b705cfSriastradh		if (posix_memalign(&ptr, PAGE_SIZE, ALIGN(size, PAGE_SIZE)))
612103b705cfSriastradh			return NULL;
612203b705cfSriastradh
612303b705cfSriastradh		bo = kgem_create_map(kgem, ptr, size, false);
612403b705cfSriastradh		if (bo == NULL) {
612503b705cfSriastradh			free(ptr);
612603b705cfSriastradh			return NULL;
612703b705cfSriastradh		}
612803b705cfSriastradh
612903b705cfSriastradh		bo->pitch = stride;
613003b705cfSriastradh		bo->unique_id = kgem_get_unique_id(kgem);
613103b705cfSriastradh		return bo;
613203b705cfSriastradh	}
613303b705cfSriastradh
613403b705cfSriastradh	return NULL;
613503b705cfSriastradh}
613603b705cfSriastradh
613703b705cfSriastradhvoid _kgem_bo_destroy(struct kgem *kgem, struct kgem_bo *bo)
613803b705cfSriastradh{
613903b705cfSriastradh	DBG(("%s: handle=%d, proxy? %d\n",
614003b705cfSriastradh	     __FUNCTION__, bo->handle, bo->proxy != NULL));
614103b705cfSriastradh
614203b705cfSriastradh	if (bo->proxy) {
61439a906b70Schristos		assert(!bo->reusable);
61449a906b70Schristos		kgem_bo_binding_free(kgem, bo);
61459a906b70Schristos
61469a906b70Schristos		assert(list_is_empty(&bo->list));
614703b705cfSriastradh		_list_del(&bo->vma);
614803b705cfSriastradh		_list_del(&bo->request);
61499a906b70Schristos
61509a906b70Schristos		if (bo->io && bo->domain == DOMAIN_CPU)
615103b705cfSriastradh			_kgem_bo_delete_buffer(kgem, bo);
61529a906b70Schristos
615303b705cfSriastradh		kgem_bo_unref(kgem, bo->proxy);
615403b705cfSriastradh
61559a906b70Schristos		if (DBG_NO_MALLOC_CACHE) {
61569a906b70Schristos			free(bo);
61579a906b70Schristos		} else {
61589a906b70Schristos			*(struct kgem_bo **)bo = __kgem_freed_bo;
61599a906b70Schristos			__kgem_freed_bo = bo;
61609a906b70Schristos		}
61619a906b70Schristos	} else
61629a906b70Schristos		__kgem_bo_destroy(kgem, bo);
616303b705cfSriastradh}
616403b705cfSriastradh
616503b705cfSriastradhstatic void __kgem_flush(struct kgem *kgem, struct kgem_bo *bo)
616603b705cfSriastradh{
616703b705cfSriastradh	assert(bo->rq);
616803b705cfSriastradh	assert(bo->exec == NULL);
616903b705cfSriastradh	assert(bo->needs_flush);
617003b705cfSriastradh
617103b705cfSriastradh	/* The kernel will emit a flush *and* update its own flushing lists. */
617203b705cfSriastradh	if (!__kgem_busy(kgem, bo->handle))
617303b705cfSriastradh		__kgem_bo_clear_busy(bo);
617403b705cfSriastradh
617503b705cfSriastradh	DBG(("%s: handle=%d, busy?=%d\n",
617603b705cfSriastradh	     __FUNCTION__, bo->handle, bo->rq != NULL));
617703b705cfSriastradh}
617803b705cfSriastradh
617903b705cfSriastradhvoid kgem_scanout_flush(struct kgem *kgem, struct kgem_bo *bo)
618003b705cfSriastradh{
618163ef14f0Smrg	if (!bo->needs_flush && !bo->gtt_dirty)
618203b705cfSriastradh		return;
618303b705cfSriastradh
61849a906b70Schristos	kgem_bo_submit(kgem, bo);
61859a906b70Schristos
618603b705cfSriastradh	/* If the kernel fails to emit the flush, then it will be forced when
618703b705cfSriastradh	 * we assume direct access. And as the usual failure is EIO, we do
618803b705cfSriastradh	 * not actually care.
618903b705cfSriastradh	 */
619003b705cfSriastradh	assert(bo->exec == NULL);
619103b705cfSriastradh	if (bo->rq)
619203b705cfSriastradh		__kgem_flush(kgem, bo);
619303b705cfSriastradh
619463ef14f0Smrg	if (bo->scanout && kgem->needs_dirtyfb) {
619563ef14f0Smrg		struct drm_mode_fb_dirty_cmd cmd;
619663ef14f0Smrg		memset(&cmd, 0, sizeof(cmd));
619763ef14f0Smrg		cmd.fb_id = bo->delta;
619863ef14f0Smrg		(void)drmIoctl(kgem->fd, DRM_IOCTL_MODE_DIRTYFB, &cmd);
619963ef14f0Smrg	}
620063ef14f0Smrg
620103b705cfSriastradh	/* Whatever actually happens, we can regard the GTT write domain
620203b705cfSriastradh	 * as being flushed.
620303b705cfSriastradh	 */
620463ef14f0Smrg	__kgem_bo_clear_dirty(bo);
620503b705cfSriastradh}
620603b705cfSriastradh
62079a906b70Schristosinline static bool nearly_idle(struct kgem *kgem)
62089a906b70Schristos{
62099a906b70Schristos	int ring = kgem->ring == KGEM_BLT;
62109a906b70Schristos
621163ef14f0Smrg	assert(ring < ARRAY_SIZE(kgem->requests));
62129a906b70Schristos	if (list_is_singular(&kgem->requests[ring]))
62139a906b70Schristos		return true;
62149a906b70Schristos
62159a906b70Schristos	return __kgem_ring_is_idle(kgem, ring);
62169a906b70Schristos}
62179a906b70Schristos
621803b705cfSriastradhinline static bool needs_semaphore(struct kgem *kgem, struct kgem_bo *bo)
621903b705cfSriastradh{
62209a906b70Schristos	if (kgem->needs_semaphore)
62219a906b70Schristos		return false;
62229a906b70Schristos
62239a906b70Schristos	if (bo->rq == NULL || RQ_RING(bo->rq) == kgem->ring)
62249a906b70Schristos		return false;
62259a906b70Schristos
62269a906b70Schristos	kgem->needs_semaphore = true;
62279a906b70Schristos	return true;
62289a906b70Schristos}
62299a906b70Schristos
62309a906b70Schristosinline static bool needs_reservation(struct kgem *kgem, struct kgem_bo *bo)
62319a906b70Schristos{
62329a906b70Schristos	if (kgem->needs_reservation)
62339a906b70Schristos		return false;
62349a906b70Schristos
62359a906b70Schristos	if (bo->presumed_offset)
62369a906b70Schristos		return false;
62379a906b70Schristos
62389a906b70Schristos	kgem->needs_reservation = true;
62399a906b70Schristos	return nearly_idle(kgem);
62409a906b70Schristos}
62419a906b70Schristos
62429a906b70Schristosinline static bool needs_batch_flush(struct kgem *kgem, struct kgem_bo *bo)
62439a906b70Schristos{
62449a906b70Schristos	bool flush = false;
62459a906b70Schristos
62469a906b70Schristos	if (needs_semaphore(kgem, bo)) {
62479a906b70Schristos		DBG(("%s: flushing before handle=%d for required semaphore\n", __FUNCTION__, bo->handle));
62489a906b70Schristos		flush = true;
62499a906b70Schristos	}
62509a906b70Schristos
62519a906b70Schristos	if (needs_reservation(kgem, bo)) {
62529a906b70Schristos		DBG(("%s: flushing before handle=%d for new reservation\n", __FUNCTION__, bo->handle));
62539a906b70Schristos		flush = true;
62549a906b70Schristos	}
62559a906b70Schristos
62569a906b70Schristos	return kgem->nreloc ? flush : false;
62579a906b70Schristos}
62589a906b70Schristos
62599a906b70Schristosstatic bool aperture_check(struct kgem *kgem, unsigned num_pages)
62609a906b70Schristos{
62619a906b70Schristos	struct drm_i915_gem_get_aperture aperture;
62629a906b70Schristos	int reserve;
62639a906b70Schristos
62649a906b70Schristos	if (kgem->aperture)
62659a906b70Schristos		return false;
62669a906b70Schristos
62679a906b70Schristos	/* Leave some space in case of alignment issues */
62689a906b70Schristos	reserve = kgem->aperture_mappable / 2;
62699a906b70Schristos	if (kgem->gen < 033 && reserve < kgem->aperture_max_fence)
62709a906b70Schristos		reserve = kgem->aperture_max_fence;
62719a906b70Schristos	if (!kgem->has_llc)
62729a906b70Schristos		reserve += kgem->nexec * PAGE_SIZE * 2;
62739a906b70Schristos
62749a906b70Schristos	DBG(("%s: num_pages=%d, holding %d pages in reserve, total aperture %d\n",
62759a906b70Schristos	     __FUNCTION__, num_pages, reserve, kgem->aperture_total));
62769a906b70Schristos	num_pages += reserve;
62779a906b70Schristos
62789a906b70Schristos	VG_CLEAR(aperture);
62799a906b70Schristos	aperture.aper_available_size = kgem->aperture_total;
62809a906b70Schristos	aperture.aper_available_size *= PAGE_SIZE;
62819a906b70Schristos	(void)do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_GET_APERTURE, &aperture);
62829a906b70Schristos
62839a906b70Schristos	DBG(("%s: aperture required %ld bytes, available %ld bytes\n",
62849a906b70Schristos	     __FUNCTION__,
62859a906b70Schristos	     (long)num_pages * PAGE_SIZE,
62869a906b70Schristos	     (long)aperture.aper_available_size));
62879a906b70Schristos
62889a906b70Schristos	return num_pages <= aperture.aper_available_size / PAGE_SIZE;
62899a906b70Schristos}
62909a906b70Schristos
62919a906b70Schristosstatic inline bool kgem_flush(struct kgem *kgem, bool flush)
62929a906b70Schristos{
62939a906b70Schristos	if (unlikely(kgem->wedged))
62949a906b70Schristos		return false;
62959a906b70Schristos
62969a906b70Schristos	if (kgem->nreloc == 0)
62979a906b70Schristos		return true;
62989a906b70Schristos
629963ef14f0Smrg	if (__to_sna(kgem)->flags & SNA_POWERSAVE)
63009a906b70Schristos		return true;
63019a906b70Schristos
63029a906b70Schristos	if (kgem->flush == flush && kgem->aperture < kgem->aperture_low)
63039a906b70Schristos		return true;
63049a906b70Schristos
63059a906b70Schristos	DBG(("%s: opportunistic flushing? flush=%d,%d, aperture=%d/%d, idle?=%d\n",
63069a906b70Schristos	     __FUNCTION__, kgem->flush, flush, kgem->aperture, kgem->aperture_low, kgem_ring_is_idle(kgem, kgem->ring)));
63079a906b70Schristos	return !kgem_ring_is_idle(kgem, kgem->ring);
630803b705cfSriastradh}
630903b705cfSriastradh
631003b705cfSriastradhbool kgem_check_bo(struct kgem *kgem, ...)
631103b705cfSriastradh{
631203b705cfSriastradh	va_list ap;
631303b705cfSriastradh	struct kgem_bo *bo;
631403b705cfSriastradh	int num_exec = 0;
631503b705cfSriastradh	int num_pages = 0;
631603b705cfSriastradh	bool flush = false;
63179a906b70Schristos	bool busy = true;
631803b705cfSriastradh
631903b705cfSriastradh	va_start(ap, kgem);
632003b705cfSriastradh	while ((bo = va_arg(ap, struct kgem_bo *))) {
632103b705cfSriastradh		while (bo->proxy)
632203b705cfSriastradh			bo = bo->proxy;
632303b705cfSriastradh		if (bo->exec)
632403b705cfSriastradh			continue;
632503b705cfSriastradh
63269a906b70Schristos		if (needs_batch_flush(kgem, bo)) {
63279a906b70Schristos			va_end(ap);
632803b705cfSriastradh			return false;
63299a906b70Schristos		}
633003b705cfSriastradh
633103b705cfSriastradh		num_pages += num_pages(bo);
633203b705cfSriastradh		num_exec++;
633303b705cfSriastradh
633403b705cfSriastradh		flush |= bo->flush;
63359a906b70Schristos		busy &= bo->rq != NULL;
633603b705cfSriastradh	}
633703b705cfSriastradh	va_end(ap);
633803b705cfSriastradh
633903b705cfSriastradh	DBG(("%s: num_pages=+%d, num_exec=+%d\n",
634003b705cfSriastradh	     __FUNCTION__, num_pages, num_exec));
634103b705cfSriastradh
634203b705cfSriastradh	if (!num_pages)
634303b705cfSriastradh		return true;
634403b705cfSriastradh
63459a906b70Schristos	if (kgem->nexec + num_exec >= KGEM_EXEC_SIZE(kgem)) {
63469a906b70Schristos		DBG(("%s: out of exec slots (%d + %d / %d)\n", __FUNCTION__,
63479a906b70Schristos		     kgem->nexec, num_exec, KGEM_EXEC_SIZE(kgem)));
634803b705cfSriastradh		return false;
634903b705cfSriastradh	}
635003b705cfSriastradh
635103b705cfSriastradh	if (num_pages + kgem->aperture > kgem->aperture_high) {
63529a906b70Schristos		DBG(("%s: final aperture usage (%d + %d) is greater than high water mark (%d)\n",
63539a906b70Schristos		     __FUNCTION__, kgem->aperture, num_pages, kgem->aperture_high));
63549a906b70Schristos		return aperture_check(kgem, num_pages);
635503b705cfSriastradh	}
635603b705cfSriastradh
63579a906b70Schristos	if (busy)
63589a906b70Schristos		return true;
635903b705cfSriastradh
63609a906b70Schristos	return kgem_flush(kgem, flush);
636103b705cfSriastradh}
636203b705cfSriastradh
636303b705cfSriastradhbool kgem_check_bo_fenced(struct kgem *kgem, struct kgem_bo *bo)
636403b705cfSriastradh{
636503b705cfSriastradh	assert(bo->refcnt);
636603b705cfSriastradh	while (bo->proxy)
636703b705cfSriastradh		bo = bo->proxy;
636803b705cfSriastradh	assert(bo->refcnt);
636903b705cfSriastradh
637003b705cfSriastradh	if (bo->exec) {
637103b705cfSriastradh		if (kgem->gen < 040 &&
637203b705cfSriastradh		    bo->tiling != I915_TILING_NONE &&
637303b705cfSriastradh		    (bo->exec->flags & EXEC_OBJECT_NEEDS_FENCE) == 0) {
63749a906b70Schristos			uint32_t size;
63759a906b70Schristos
63769a906b70Schristos			assert(bo->tiling == I915_TILING_X);
63779a906b70Schristos
637803b705cfSriastradh			if (kgem->nfence >= kgem->fence_max)
637903b705cfSriastradh				return false;
638003b705cfSriastradh
63819a906b70Schristos			if (kgem->aperture_fenced) {
63829a906b70Schristos				size = 3*kgem->aperture_fenced;
63839a906b70Schristos				if (kgem->aperture_total == kgem->aperture_mappable)
63849a906b70Schristos					size += kgem->aperture;
63859a906b70Schristos				if (size > kgem->aperture_fenceable &&
63869a906b70Schristos				    kgem_ring_is_idle(kgem, kgem->ring)) {
63879a906b70Schristos					DBG(("%s: opportunistic fence flush\n", __FUNCTION__));
63889a906b70Schristos					return false;
63899a906b70Schristos				}
63909a906b70Schristos			}
639103b705cfSriastradh
63929a906b70Schristos			size = kgem_bo_fenced_size(kgem, bo);
63939a906b70Schristos			if (size > kgem->aperture_max_fence)
63949a906b70Schristos				kgem->aperture_max_fence = size;
63959a906b70Schristos			size += kgem->aperture_fenced;
63969a906b70Schristos			if (kgem->gen < 033 && size < 2 * kgem->aperture_max_fence)
63979a906b70Schristos				size = 2 * kgem->aperture_max_fence;
63989a906b70Schristos			if (kgem->aperture_total == kgem->aperture_mappable)
63999a906b70Schristos				size += kgem->aperture;
64009a906b70Schristos			if (size > kgem->aperture_fenceable) {
64019a906b70Schristos				DBG(("%s: estimated fence space required %d (fenced=%d, max_fence=%d, aperture=%d) exceeds fenceable aperture %d\n",
64029a906b70Schristos				     __FUNCTION__, size, kgem->aperture_fenced, kgem->aperture_max_fence, kgem->aperture, kgem->aperture_fenceable));
640303b705cfSriastradh				return false;
64049a906b70Schristos			}
640503b705cfSriastradh		}
640603b705cfSriastradh
640703b705cfSriastradh		return true;
640803b705cfSriastradh	}
640903b705cfSriastradh
641003b705cfSriastradh	if (kgem->nexec >= KGEM_EXEC_SIZE(kgem) - 1)
641103b705cfSriastradh		return false;
641203b705cfSriastradh
64139a906b70Schristos	if (needs_batch_flush(kgem, bo))
641403b705cfSriastradh		return false;
641503b705cfSriastradh
641603b705cfSriastradh	assert_tiling(kgem, bo);
641703b705cfSriastradh	if (kgem->gen < 040 && bo->tiling != I915_TILING_NONE) {
64189a906b70Schristos		uint32_t size;
64199a906b70Schristos
64209a906b70Schristos		assert(bo->tiling == I915_TILING_X);
64219a906b70Schristos
642203b705cfSriastradh		if (kgem->nfence >= kgem->fence_max)
642303b705cfSriastradh			return false;
642403b705cfSriastradh
64259a906b70Schristos		if (kgem->aperture_fenced) {
64269a906b70Schristos			size = 3*kgem->aperture_fenced;
64279a906b70Schristos			if (kgem->aperture_total == kgem->aperture_mappable)
64289a906b70Schristos				size += kgem->aperture;
64299a906b70Schristos			if (size > kgem->aperture_fenceable &&
64309a906b70Schristos			    kgem_ring_is_idle(kgem, kgem->ring)) {
64319a906b70Schristos				DBG(("%s: opportunistic fence flush\n", __FUNCTION__));
64329a906b70Schristos				return false;
64339a906b70Schristos			}
64349a906b70Schristos		}
643503b705cfSriastradh
64369a906b70Schristos		size = kgem_bo_fenced_size(kgem, bo);
64379a906b70Schristos		if (size > kgem->aperture_max_fence)
64389a906b70Schristos			kgem->aperture_max_fence = size;
64399a906b70Schristos		size += kgem->aperture_fenced;
64409a906b70Schristos		if (kgem->gen < 033 && size < 2 * kgem->aperture_max_fence)
64419a906b70Schristos			size = 2 * kgem->aperture_max_fence;
64429a906b70Schristos		if (kgem->aperture_total == kgem->aperture_mappable)
64439a906b70Schristos			size += kgem->aperture;
64449a906b70Schristos		if (size > kgem->aperture_fenceable) {
64459a906b70Schristos			DBG(("%s: estimated fence space required %d (fenced=%d, max_fence=%d, aperture=%d) exceeds fenceable aperture %d\n",
64469a906b70Schristos			     __FUNCTION__, size, kgem->aperture_fenced, kgem->aperture_max_fence, kgem->aperture, kgem->aperture_fenceable));
644703b705cfSriastradh			return false;
64489a906b70Schristos		}
644903b705cfSriastradh	}
645003b705cfSriastradh
64519a906b70Schristos	if (kgem->aperture + kgem->aperture_fenced + num_pages(bo) > kgem->aperture_high) {
64529a906b70Schristos		DBG(("%s: final aperture usage (%d + %d) is greater than high water mark (%d)\n",
64539a906b70Schristos		     __FUNCTION__, kgem->aperture, num_pages(bo), kgem->aperture_high));
64549a906b70Schristos		return aperture_check(kgem, num_pages(bo));
64559a906b70Schristos	}
64569a906b70Schristos
64579a906b70Schristos	if (bo->rq)
64589a906b70Schristos		return true;
64599a906b70Schristos
64609a906b70Schristos	return kgem_flush(kgem, bo->flush);
646103b705cfSriastradh}
646203b705cfSriastradh
646303b705cfSriastradhbool kgem_check_many_bo_fenced(struct kgem *kgem, ...)
646403b705cfSriastradh{
646503b705cfSriastradh	va_list ap;
646603b705cfSriastradh	struct kgem_bo *bo;
646703b705cfSriastradh	int num_fence = 0;
646803b705cfSriastradh	int num_exec = 0;
646903b705cfSriastradh	int num_pages = 0;
647003b705cfSriastradh	int fenced_size = 0;
647103b705cfSriastradh	bool flush = false;
64729a906b70Schristos	bool busy = true;
647303b705cfSriastradh
647403b705cfSriastradh	va_start(ap, kgem);
647503b705cfSriastradh	while ((bo = va_arg(ap, struct kgem_bo *))) {
647603b705cfSriastradh		assert(bo->refcnt);
647703b705cfSriastradh		while (bo->proxy)
647803b705cfSriastradh			bo = bo->proxy;
647903b705cfSriastradh		assert(bo->refcnt);
648003b705cfSriastradh		if (bo->exec) {
648103b705cfSriastradh			if (kgem->gen >= 040 || bo->tiling == I915_TILING_NONE)
648203b705cfSriastradh				continue;
648303b705cfSriastradh
648403b705cfSriastradh			if ((bo->exec->flags & EXEC_OBJECT_NEEDS_FENCE) == 0) {
648503b705cfSriastradh				fenced_size += kgem_bo_fenced_size(kgem, bo);
648603b705cfSriastradh				num_fence++;
648703b705cfSriastradh			}
648803b705cfSriastradh
648903b705cfSriastradh			continue;
649003b705cfSriastradh		}
649103b705cfSriastradh
64929a906b70Schristos		if (needs_batch_flush(kgem, bo)) {
64939a906b70Schristos			va_end(ap);
649403b705cfSriastradh			return false;
64959a906b70Schristos		}
649603b705cfSriastradh
649703b705cfSriastradh		assert_tiling(kgem, bo);
649803b705cfSriastradh		num_pages += num_pages(bo);
649903b705cfSriastradh		num_exec++;
650003b705cfSriastradh		if (kgem->gen < 040 && bo->tiling) {
65019a906b70Schristos			uint32_t size = kgem_bo_fenced_size(kgem, bo);
65029a906b70Schristos			if (size > kgem->aperture_max_fence)
65039a906b70Schristos				kgem->aperture_max_fence = size;
65049a906b70Schristos			fenced_size += size;
650503b705cfSriastradh			num_fence++;
650603b705cfSriastradh		}
650703b705cfSriastradh
650803b705cfSriastradh		flush |= bo->flush;
65099a906b70Schristos		busy &= bo->rq != NULL;
651003b705cfSriastradh	}
651103b705cfSriastradh	va_end(ap);
651203b705cfSriastradh
651303b705cfSriastradh	if (num_fence) {
65149a906b70Schristos		uint32_t size;
65159a906b70Schristos
651603b705cfSriastradh		if (kgem->nfence + num_fence > kgem->fence_max)
651703b705cfSriastradh			return false;
651803b705cfSriastradh
65199a906b70Schristos		if (kgem->aperture_fenced) {
65209a906b70Schristos			size = 3*kgem->aperture_fenced;
65219a906b70Schristos			if (kgem->aperture_total == kgem->aperture_mappable)
65229a906b70Schristos				size += kgem->aperture;
65239a906b70Schristos			if (size > kgem->aperture_fenceable &&
65249a906b70Schristos			    kgem_ring_is_idle(kgem, kgem->ring)) {
65259a906b70Schristos				DBG(("%s: opportunistic fence flush\n", __FUNCTION__));
65269a906b70Schristos				return false;
65279a906b70Schristos			}
65289a906b70Schristos		}
652903b705cfSriastradh
65309a906b70Schristos		size = kgem->aperture_fenced;
65319a906b70Schristos		size += fenced_size;
65329a906b70Schristos		if (kgem->gen < 033 && size < 2 * kgem->aperture_max_fence)
65339a906b70Schristos			size = 2 * kgem->aperture_max_fence;
65349a906b70Schristos		if (kgem->aperture_total == kgem->aperture_mappable)
65359a906b70Schristos			size += kgem->aperture;
65369a906b70Schristos		if (size > kgem->aperture_fenceable) {
65379a906b70Schristos			DBG(("%s: estimated fence space required %d (fenced=%d, max_fence=%d, aperture=%d) exceeds fenceable aperture %d\n",
65389a906b70Schristos			     __FUNCTION__, size, kgem->aperture_fenced, kgem->aperture_max_fence, kgem->aperture, kgem->aperture_fenceable));
653903b705cfSriastradh			return false;
65409a906b70Schristos		}
654103b705cfSriastradh	}
654203b705cfSriastradh
65439a906b70Schristos	if (num_pages == 0)
65449a906b70Schristos		return true;
654503b705cfSriastradh
65469a906b70Schristos	if (kgem->nexec + num_exec >= KGEM_EXEC_SIZE(kgem))
65479a906b70Schristos		return false;
654803b705cfSriastradh
65499a906b70Schristos	if (num_pages + kgem->aperture > kgem->aperture_high - kgem->aperture_fenced) {
65509a906b70Schristos		DBG(("%s: final aperture usage (%d + %d + %d) is greater than high water mark (%d)\n",
65519a906b70Schristos		     __FUNCTION__, kgem->aperture, kgem->aperture_fenced, num_pages, kgem->aperture_high));
65529a906b70Schristos		return aperture_check(kgem, num_pages);
655303b705cfSriastradh	}
655403b705cfSriastradh
65559a906b70Schristos	if (busy)
65569a906b70Schristos		return true;
65579a906b70Schristos
65589a906b70Schristos	return kgem_flush(kgem, flush);
655903b705cfSriastradh}
656003b705cfSriastradh
656163ef14f0Smrgvoid __kgem_bcs_set_tiling(struct kgem *kgem,
656263ef14f0Smrg			   struct kgem_bo *src,
656363ef14f0Smrg			   struct kgem_bo *dst)
656463ef14f0Smrg{
656563ef14f0Smrg	uint32_t state, *b;
656663ef14f0Smrg
656763ef14f0Smrg	DBG(("%s: src handle=%d:tiling=%d, dst handle=%d:tiling=%d\n",
656863ef14f0Smrg	     __FUNCTION__,
656963ef14f0Smrg	     src ? src->handle : 0, src ? src->tiling : 0,
657063ef14f0Smrg	     dst ? dst->handle : 0, dst ? dst->tiling : 0));
657163ef14f0Smrg	assert(kgem->mode == KGEM_BLT);
657263ef14f0Smrg	assert(dst == NULL || kgem_bo_can_blt(kgem, dst));
657363ef14f0Smrg	assert(src == NULL || kgem_bo_can_blt(kgem, src));
657463ef14f0Smrg
657563ef14f0Smrg	state = 0;
657663ef14f0Smrg	if (dst && dst->tiling == I915_TILING_Y)
657763ef14f0Smrg		state |= BCS_DST_Y;
657863ef14f0Smrg	if (src && src->tiling == I915_TILING_Y)
657963ef14f0Smrg		state |= BCS_SRC_Y;
658063ef14f0Smrg
658163ef14f0Smrg	if (kgem->bcs_state == state)
658263ef14f0Smrg		return;
658363ef14f0Smrg
658463ef14f0Smrg	DBG(("%s: updating SWCTRL %x -> %x\n", __FUNCTION__,
658563ef14f0Smrg	     kgem->bcs_state, state));
658663ef14f0Smrg
658763ef14f0Smrg	/* Over-estimate space in case we need to re-emit the cmd packet */
658863ef14f0Smrg	if (!kgem_check_batch(kgem, 24)) {
658963ef14f0Smrg		_kgem_submit(kgem);
659063ef14f0Smrg		_kgem_set_mode(kgem, KGEM_BLT);
659163ef14f0Smrg		if (state == 0)
659263ef14f0Smrg			return;
659363ef14f0Smrg	}
659463ef14f0Smrg
659563ef14f0Smrg	b = kgem->batch + kgem->nbatch;
659663ef14f0Smrg	if (kgem->nbatch) {
659763ef14f0Smrg		*b++ = MI_FLUSH_DW;
659863ef14f0Smrg		*b++ = 0;
659963ef14f0Smrg		*b++ = 0;
660063ef14f0Smrg		*b++ = 0;
660163ef14f0Smrg	}
660263ef14f0Smrg	*b++ = MI_LOAD_REGISTER_IMM;
660363ef14f0Smrg	*b++ = BCS_SWCTRL;
660463ef14f0Smrg	*b++ = (BCS_SRC_Y | BCS_DST_Y) << 16 | state;
660563ef14f0Smrg	kgem->nbatch = b - kgem->batch;
660663ef14f0Smrg
660763ef14f0Smrg	kgem->bcs_state = state;
660863ef14f0Smrg}
660963ef14f0Smrg
661003b705cfSriastradhuint32_t kgem_add_reloc(struct kgem *kgem,
661103b705cfSriastradh			uint32_t pos,
661203b705cfSriastradh			struct kgem_bo *bo,
661303b705cfSriastradh			uint32_t read_write_domain,
661403b705cfSriastradh			uint32_t delta)
661503b705cfSriastradh{
661603b705cfSriastradh	int index;
661703b705cfSriastradh
661803b705cfSriastradh	DBG(("%s: handle=%d, pos=%d, delta=%d, domains=%08x\n",
661903b705cfSriastradh	     __FUNCTION__, bo ? bo->handle : 0, pos, delta, read_write_domain));
662003b705cfSriastradh
66219a906b70Schristos	assert(kgem->gen < 0100);
662203b705cfSriastradh	assert((read_write_domain & 0x7fff) == 0 || bo != NULL);
662303b705cfSriastradh
662403b705cfSriastradh	index = kgem->nreloc++;
662503b705cfSriastradh	assert(index < ARRAY_SIZE(kgem->reloc));
662603b705cfSriastradh	kgem->reloc[index].offset = pos * sizeof(kgem->batch[0]);
662703b705cfSriastradh	if (bo) {
66289a906b70Schristos		assert(kgem->mode != KGEM_NONE);
662903b705cfSriastradh		assert(bo->refcnt);
663003b705cfSriastradh		while (bo->proxy) {
663103b705cfSriastradh			DBG(("%s: adding proxy [delta=%d] for handle=%d\n",
663203b705cfSriastradh			     __FUNCTION__, bo->delta, bo->handle));
663303b705cfSriastradh			delta += bo->delta;
663403b705cfSriastradh			assert(bo->handle == bo->proxy->handle);
663503b705cfSriastradh			/* need to release the cache upon batch submit */
663603b705cfSriastradh			if (bo->exec == NULL) {
663703b705cfSriastradh				list_move_tail(&bo->request,
663803b705cfSriastradh					       &kgem->next_request->buffers);
663903b705cfSriastradh				bo->rq = MAKE_REQUEST(kgem->next_request,
664003b705cfSriastradh						      kgem->ring);
664103b705cfSriastradh				bo->exec = &_kgem_dummy_exec;
66429a906b70Schristos				bo->domain = DOMAIN_GPU;
664303b705cfSriastradh			}
664403b705cfSriastradh
664503b705cfSriastradh			if (read_write_domain & 0x7fff && !bo->gpu_dirty)
664603b705cfSriastradh				__kgem_bo_mark_dirty(bo);
664703b705cfSriastradh
664803b705cfSriastradh			bo = bo->proxy;
664903b705cfSriastradh			assert(bo->refcnt);
665003b705cfSriastradh		}
665103b705cfSriastradh		assert(bo->refcnt);
665203b705cfSriastradh
665303b705cfSriastradh		if (bo->exec == NULL)
665403b705cfSriastradh			kgem_add_bo(kgem, bo);
665503b705cfSriastradh		assert(bo->rq == MAKE_REQUEST(kgem->next_request, kgem->ring));
665603b705cfSriastradh		assert(RQ_RING(bo->rq) == kgem->ring);
665703b705cfSriastradh
665803b705cfSriastradh		if (kgem->gen < 040 && read_write_domain & KGEM_RELOC_FENCED) {
665903b705cfSriastradh			if (bo->tiling &&
666003b705cfSriastradh			    (bo->exec->flags & EXEC_OBJECT_NEEDS_FENCE) == 0) {
66619a906b70Schristos				assert(bo->tiling == I915_TILING_X);
666203b705cfSriastradh				assert(kgem->nfence < kgem->fence_max);
666303b705cfSriastradh				kgem->aperture_fenced +=
666403b705cfSriastradh					kgem_bo_fenced_size(kgem, bo);
666503b705cfSriastradh				kgem->nfence++;
666603b705cfSriastradh			}
666703b705cfSriastradh			bo->exec->flags |= EXEC_OBJECT_NEEDS_FENCE;
666803b705cfSriastradh		}
666903b705cfSriastradh
667003b705cfSriastradh		kgem->reloc[index].delta = delta;
667103b705cfSriastradh		kgem->reloc[index].target_handle = bo->target_handle;
667203b705cfSriastradh		kgem->reloc[index].presumed_offset = bo->presumed_offset;
667303b705cfSriastradh
667403b705cfSriastradh		if (read_write_domain & 0x7fff && !bo->gpu_dirty) {
667503b705cfSriastradh			assert(!bo->snoop || kgem->can_blt_cpu);
667603b705cfSriastradh			__kgem_bo_mark_dirty(bo);
667703b705cfSriastradh		}
667803b705cfSriastradh
667903b705cfSriastradh		delta += bo->presumed_offset;
668003b705cfSriastradh	} else {
668103b705cfSriastradh		kgem->reloc[index].delta = delta;
668203b705cfSriastradh		kgem->reloc[index].target_handle = ~0U;
668303b705cfSriastradh		kgem->reloc[index].presumed_offset = 0;
668403b705cfSriastradh		if (kgem->nreloc__self < 256)
668503b705cfSriastradh			kgem->reloc__self[kgem->nreloc__self++] = index;
668603b705cfSriastradh	}
668703b705cfSriastradh	kgem->reloc[index].read_domains = read_write_domain >> 16;
668803b705cfSriastradh	kgem->reloc[index].write_domain = read_write_domain & 0x7fff;
668903b705cfSriastradh
669003b705cfSriastradh	return delta;
669103b705cfSriastradh}
669203b705cfSriastradh
66939a906b70Schristosuint64_t kgem_add_reloc64(struct kgem *kgem,
66949a906b70Schristos			  uint32_t pos,
66959a906b70Schristos			  struct kgem_bo *bo,
66969a906b70Schristos			  uint32_t read_write_domain,
66979a906b70Schristos			  uint64_t delta)
66989a906b70Schristos{
66999a906b70Schristos	int index;
67009a906b70Schristos
67019a906b70Schristos	DBG(("%s: handle=%d, pos=%d, delta=%ld, domains=%08x\n",
67029a906b70Schristos	     __FUNCTION__, bo ? bo->handle : 0, pos, (long)delta, read_write_domain));
67039a906b70Schristos
67049a906b70Schristos	assert(kgem->gen >= 0100);
67059a906b70Schristos	assert((read_write_domain & 0x7fff) == 0 || bo != NULL);
67069a906b70Schristos
67079a906b70Schristos	index = kgem->nreloc++;
67089a906b70Schristos	assert(index < ARRAY_SIZE(kgem->reloc));
67099a906b70Schristos	kgem->reloc[index].offset = pos * sizeof(kgem->batch[0]);
67109a906b70Schristos	if (bo) {
67119a906b70Schristos		assert(kgem->mode != KGEM_NONE);
67129a906b70Schristos		assert(bo->refcnt);
67139a906b70Schristos		while (bo->proxy) {
67149a906b70Schristos			DBG(("%s: adding proxy [delta=%ld] for handle=%d\n",
67159a906b70Schristos			     __FUNCTION__, (long)bo->delta, bo->handle));
67169a906b70Schristos			delta += bo->delta;
67179a906b70Schristos			assert(bo->handle == bo->proxy->handle);
67189a906b70Schristos			/* need to release the cache upon batch submit */
67199a906b70Schristos			if (bo->exec == NULL) {
67209a906b70Schristos				list_move_tail(&bo->request,
67219a906b70Schristos					       &kgem->next_request->buffers);
67229a906b70Schristos				bo->rq = MAKE_REQUEST(kgem->next_request,
67239a906b70Schristos						      kgem->ring);
67249a906b70Schristos				bo->exec = &_kgem_dummy_exec;
67259a906b70Schristos				bo->domain = DOMAIN_GPU;
67269a906b70Schristos			}
67279a906b70Schristos
67289a906b70Schristos			if (read_write_domain & 0x7fff && !bo->gpu_dirty)
67299a906b70Schristos				__kgem_bo_mark_dirty(bo);
67309a906b70Schristos
67319a906b70Schristos			bo = bo->proxy;
67329a906b70Schristos			assert(bo->refcnt);
67339a906b70Schristos		}
67349a906b70Schristos		assert(bo->refcnt);
67359a906b70Schristos
67369a906b70Schristos		if (bo->exec == NULL)
67379a906b70Schristos			kgem_add_bo(kgem, bo);
67389a906b70Schristos		assert(bo->rq == MAKE_REQUEST(kgem->next_request, kgem->ring));
67399a906b70Schristos		assert(RQ_RING(bo->rq) == kgem->ring);
67409a906b70Schristos
67419a906b70Schristos		DBG(("%s[%d] = (delta=%d, target handle=%d, presumed=%llx)\n",
67429a906b70Schristos					__FUNCTION__, index, delta, bo->target_handle, (long long)bo->presumed_offset));
67439a906b70Schristos		kgem->reloc[index].delta = delta;
67449a906b70Schristos		kgem->reloc[index].target_handle = bo->target_handle;
67459a906b70Schristos		kgem->reloc[index].presumed_offset = bo->presumed_offset;
67469a906b70Schristos
67479a906b70Schristos		if (read_write_domain & 0x7fff && !bo->gpu_dirty) {
67489a906b70Schristos			assert(!bo->snoop || kgem->can_blt_cpu);
67499a906b70Schristos			__kgem_bo_mark_dirty(bo);
67509a906b70Schristos		}
67519a906b70Schristos
67529a906b70Schristos		delta += bo->presumed_offset;
67539a906b70Schristos	} else {
67549a906b70Schristos		DBG(("%s[%d] = (delta=%d, target handle=batch)\n",
67559a906b70Schristos					__FUNCTION__, index, delta));
67569a906b70Schristos		kgem->reloc[index].delta = delta;
67579a906b70Schristos		kgem->reloc[index].target_handle = ~0U;
67589a906b70Schristos		kgem->reloc[index].presumed_offset = 0;
67599a906b70Schristos		if (kgem->nreloc__self < 256)
67609a906b70Schristos			kgem->reloc__self[kgem->nreloc__self++] = index;
67619a906b70Schristos	}
67629a906b70Schristos	kgem->reloc[index].read_domains = read_write_domain >> 16;
67639a906b70Schristos	kgem->reloc[index].write_domain = read_write_domain & 0x7fff;
67649a906b70Schristos
67659a906b70Schristos	return delta;
67669a906b70Schristos}
67679a906b70Schristos
676803b705cfSriastradhstatic void kgem_trim_vma_cache(struct kgem *kgem, int type, int bucket)
676903b705cfSriastradh{
677003b705cfSriastradh	int i, j;
677103b705cfSriastradh
677203b705cfSriastradh	DBG(("%s: type=%d, count=%d (bucket: %d)\n",
677303b705cfSriastradh	     __FUNCTION__, type, kgem->vma[type].count, bucket));
677403b705cfSriastradh	if (kgem->vma[type].count <= 0)
677503b705cfSriastradh	       return;
677603b705cfSriastradh
677703b705cfSriastradh	if (kgem->need_purge)
677803b705cfSriastradh		kgem_purge_cache(kgem);
677903b705cfSriastradh
678003b705cfSriastradh	/* vma are limited on a per-process basis to around 64k.
678103b705cfSriastradh	 * This includes all malloc arenas as well as other file
678203b705cfSriastradh	 * mappings. In order to be fair and not hog the cache,
678303b705cfSriastradh	 * and more importantly not to exhaust that limit and to
678403b705cfSriastradh	 * start failing mappings, we keep our own number of open
678503b705cfSriastradh	 * vma to within a conservative value.
678603b705cfSriastradh	 */
678703b705cfSriastradh	i = 0;
678803b705cfSriastradh	while (kgem->vma[type].count > 0) {
678903b705cfSriastradh		struct kgem_bo *bo = NULL;
679003b705cfSriastradh
679103b705cfSriastradh		for (j = 0;
679203b705cfSriastradh		     bo == NULL && j < ARRAY_SIZE(kgem->vma[type].inactive);
679303b705cfSriastradh		     j++) {
679403b705cfSriastradh			struct list *head = &kgem->vma[type].inactive[i++%ARRAY_SIZE(kgem->vma[type].inactive)];
679503b705cfSriastradh			if (!list_is_empty(head))
679603b705cfSriastradh				bo = list_last_entry(head, struct kgem_bo, vma);
679703b705cfSriastradh		}
679803b705cfSriastradh		if (bo == NULL)
679903b705cfSriastradh			break;
680003b705cfSriastradh
680103b705cfSriastradh		DBG(("%s: discarding inactive %s vma cache for %d\n",
68029a906b70Schristos		     __FUNCTION__, type ? "CPU" : "GTT", bo->handle));
68039a906b70Schristos
680403b705cfSriastradh		assert(bo->rq == NULL);
6805813957e3Ssnj		if (type) {
6806813957e3Ssnj			VG(VALGRIND_MAKE_MEM_NOACCESS(MAP(bo->map__cpu), bytes(bo)));
6807813957e3Ssnj			munmap(MAP(bo->map__cpu), bytes(bo));
6808813957e3Ssnj			bo->map__cpu = NULL;
6809813957e3Ssnj		} else {
6810813957e3Ssnj			if (bo->map__wc) {
6811813957e3Ssnj				VG(VALGRIND_MAKE_MEM_NOACCESS(bo->map__wc, bytes(bo)));
6812813957e3Ssnj				munmap(bo->map__wc, bytes(bo));
6813813957e3Ssnj				bo->map__wc = NULL;
6814813957e3Ssnj			}
6815813957e3Ssnj			if (bo->map__gtt) {
6816813957e3Ssnj				munmap(bo->map__gtt, bytes(bo));
6817813957e3Ssnj				bo->map__gtt = NULL;
6818813957e3Ssnj			}
6819813957e3Ssnj		}
682003b705cfSriastradh
682103b705cfSriastradh		list_del(&bo->vma);
682203b705cfSriastradh		kgem->vma[type].count--;
682303b705cfSriastradh	}
682403b705cfSriastradh}
682503b705cfSriastradh
6826813957e3Ssnjstatic void *__kgem_bo_map__gtt_or_wc(struct kgem *kgem, struct kgem_bo *bo)
682703b705cfSriastradh{
682803b705cfSriastradh	void *ptr;
682903b705cfSriastradh
6830813957e3Ssnj	DBG(("%s: handle=%d\n", __FUNCTION__, bo->handle));
6831813957e3Ssnj
6832813957e3Ssnj	assert(bo->proxy == NULL);
6833813957e3Ssnj	assert(!bo->snoop);
6834813957e3Ssnj
6835813957e3Ssnj	kgem_trim_vma_cache(kgem, MAP_GTT, bucket(bo));
6836813957e3Ssnj
6837813957e3Ssnj	if (bo->tiling || !kgem->has_wc_mmap) {
6838813957e3Ssnj		assert(kgem->gen != 021 || bo->tiling != I915_TILING_Y);
683963ef14f0Smrg		warn_unless(num_pages(bo) <= kgem->aperture_mappable / 2);
6840813957e3Ssnj
6841813957e3Ssnj		ptr = bo->map__gtt;
6842813957e3Ssnj		if (ptr == NULL)
6843813957e3Ssnj			ptr = __kgem_bo_map__gtt(kgem, bo);
6844813957e3Ssnj	} else {
6845813957e3Ssnj		ptr = bo->map__wc;
6846813957e3Ssnj		if (ptr == NULL)
6847813957e3Ssnj			ptr = __kgem_bo_map__wc(kgem, bo);
6848813957e3Ssnj	}
6849813957e3Ssnj
6850813957e3Ssnj	return ptr;
6851813957e3Ssnj}
6852813957e3Ssnj
6853813957e3Ssnjvoid *kgem_bo_map__async(struct kgem *kgem, struct kgem_bo *bo)
6854813957e3Ssnj{
68559a906b70Schristos	DBG(("%s: handle=%d, offset=%ld, tiling=%d, map=%p:%p, domain=%d\n", __FUNCTION__,
68569a906b70Schristos	     bo->handle, (long)bo->presumed_offset, bo->tiling, bo->map__gtt, bo->map__cpu, bo->domain));
685703b705cfSriastradh
685803b705cfSriastradh	assert(bo->proxy == NULL);
685903b705cfSriastradh	assert(list_is_empty(&bo->list));
686003b705cfSriastradh	assert_tiling(kgem, bo);
68619a906b70Schristos	assert(!bo->purged || bo->reusable);
686203b705cfSriastradh
686303b705cfSriastradh	if (bo->tiling == I915_TILING_NONE && !bo->scanout && kgem->has_llc) {
686403b705cfSriastradh		DBG(("%s: converting request for GTT map into CPU map\n",
686503b705cfSriastradh		     __FUNCTION__));
686603b705cfSriastradh		return kgem_bo_map__cpu(kgem, bo);
686703b705cfSriastradh	}
686803b705cfSriastradh
6869813957e3Ssnj	return __kgem_bo_map__gtt_or_wc(kgem, bo);
687003b705cfSriastradh}
687103b705cfSriastradh
687203b705cfSriastradhvoid *kgem_bo_map(struct kgem *kgem, struct kgem_bo *bo)
687303b705cfSriastradh{
687403b705cfSriastradh	void *ptr;
687503b705cfSriastradh
68769a906b70Schristos	DBG(("%s: handle=%d, offset=%ld, tiling=%d, map=%p:%p, domain=%d\n", __FUNCTION__,
68779a906b70Schristos	     bo->handle, (long)bo->presumed_offset, bo->tiling, bo->map__gtt, bo->map__cpu, bo->domain));
687803b705cfSriastradh
687903b705cfSriastradh	assert(bo->proxy == NULL);
688003b705cfSriastradh	assert(list_is_empty(&bo->list));
688103b705cfSriastradh	assert(bo->exec == NULL);
688203b705cfSriastradh	assert_tiling(kgem, bo);
68839a906b70Schristos	assert(!bo->purged || bo->reusable);
688403b705cfSriastradh
688503b705cfSriastradh	if (bo->tiling == I915_TILING_NONE && !bo->scanout &&
688603b705cfSriastradh	    (kgem->has_llc || bo->domain == DOMAIN_CPU)) {
688703b705cfSriastradh		DBG(("%s: converting request for GTT map into CPU map\n",
688803b705cfSriastradh		     __FUNCTION__));
688903b705cfSriastradh		ptr = kgem_bo_map__cpu(kgem, bo);
689003b705cfSriastradh		if (ptr)
689103b705cfSriastradh			kgem_bo_sync__cpu(kgem, bo);
689203b705cfSriastradh		return ptr;
689303b705cfSriastradh	}
689403b705cfSriastradh
6895813957e3Ssnj	ptr = __kgem_bo_map__gtt_or_wc(kgem, bo);
689603b705cfSriastradh
689703b705cfSriastradh	if (bo->domain != DOMAIN_GTT || FORCE_MMAP_SYNC & (1 << DOMAIN_GTT)) {
689803b705cfSriastradh		struct drm_i915_gem_set_domain set_domain;
689903b705cfSriastradh
690003b705cfSriastradh		DBG(("%s: sync: needs_flush? %d, domain? %d, busy? %d\n", __FUNCTION__,
690103b705cfSriastradh		     bo->needs_flush, bo->domain, __kgem_busy(kgem, bo->handle)));
690203b705cfSriastradh
690303b705cfSriastradh		/* XXX use PROT_READ to avoid the write flush? */
690403b705cfSriastradh
690503b705cfSriastradh		VG_CLEAR(set_domain);
690603b705cfSriastradh		set_domain.handle = bo->handle;
690703b705cfSriastradh		set_domain.read_domains = I915_GEM_DOMAIN_GTT;
690803b705cfSriastradh		set_domain.write_domain = I915_GEM_DOMAIN_GTT;
69099a906b70Schristos		if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_DOMAIN, &set_domain)) {
69109a906b70Schristos			DBG(("%s: sync: GPU hang detected\n", __FUNCTION__));
69119a906b70Schristos			kgem_throttle(kgem);
691203b705cfSriastradh		}
691363ef14f0Smrg		bo->needs_flush = false;
69149a906b70Schristos		kgem_bo_retire(kgem, bo);
69159a906b70Schristos		bo->domain = DOMAIN_GTT;
69169a906b70Schristos		bo->gtt_dirty = true;
691703b705cfSriastradh	}
691803b705cfSriastradh
691903b705cfSriastradh	return ptr;
692003b705cfSriastradh}
692103b705cfSriastradh
692203b705cfSriastradhvoid *kgem_bo_map__gtt(struct kgem *kgem, struct kgem_bo *bo)
692303b705cfSriastradh{
69249a906b70Schristos	DBG(("%s: handle=%d, offset=%ld, tiling=%d, map=%p:%p, domain=%d\n", __FUNCTION__,
69259a906b70Schristos	     bo->handle, (long)bo->presumed_offset, bo->tiling, bo->map__gtt, bo->map__cpu, bo->domain));
692603b705cfSriastradh
69279a906b70Schristos	assert(bo->proxy == NULL);
692803b705cfSriastradh	assert(bo->exec == NULL);
692903b705cfSriastradh	assert(list_is_empty(&bo->list));
693003b705cfSriastradh	assert_tiling(kgem, bo);
69319a906b70Schristos	assert(!bo->purged || bo->reusable);
693203b705cfSriastradh
6933813957e3Ssnj	return __kgem_bo_map__gtt_or_wc(kgem, bo);
6934813957e3Ssnj}
693503b705cfSriastradh
6936813957e3Ssnjvoid *kgem_bo_map__wc(struct kgem *kgem, struct kgem_bo *bo)
6937813957e3Ssnj{
6938813957e3Ssnj	DBG(("%s: handle=%d, offset=%ld, tiling=%d, map=%p:%p, domain=%d\n", __FUNCTION__,
6939813957e3Ssnj	     bo->handle, (long)bo->presumed_offset, bo->tiling, bo->map__gtt, bo->map__cpu, bo->domain));
694003b705cfSriastradh
6941813957e3Ssnj	assert(bo->proxy == NULL);
6942813957e3Ssnj	assert(list_is_empty(&bo->list));
6943813957e3Ssnj	assert_tiling(kgem, bo);
6944813957e3Ssnj	assert(!bo->purged || bo->reusable);
694503b705cfSriastradh
6946813957e3Ssnj	if (bo->map__wc)
6947813957e3Ssnj		return bo->map__wc;
694863ef14f0Smrg	if (!kgem->has_wc_mmap)
694963ef14f0Smrg		return NULL;
695003b705cfSriastradh
695163ef14f0Smrg	kgem_trim_vma_cache(kgem, MAP_GTT, bucket(bo));
6952813957e3Ssnj	return __kgem_bo_map__wc(kgem, bo);
695303b705cfSriastradh}
695403b705cfSriastradh
695503b705cfSriastradhvoid *kgem_bo_map__cpu(struct kgem *kgem, struct kgem_bo *bo)
695603b705cfSriastradh{
69579a906b70Schristos	DBG(("%s(handle=%d, size=%d, map=%p:%p)\n",
69589a906b70Schristos	     __FUNCTION__, bo->handle, bytes(bo), bo->map__gtt, bo->map__cpu));
695903b705cfSriastradh	assert(!bo->purged);
696003b705cfSriastradh	assert(list_is_empty(&bo->list));
696103b705cfSriastradh	assert(bo->proxy == NULL);
69629a906b70Schristos	assert_tiling(kgem, bo);
696303b705cfSriastradh
69649a906b70Schristos	if (bo->map__cpu)
69659a906b70Schristos		return MAP(bo->map__cpu);
696603b705cfSriastradh
696703b705cfSriastradh	kgem_trim_vma_cache(kgem, MAP_CPU, bucket(bo));
696803b705cfSriastradh
6969813957e3Ssnj	return __kgem_bo_map__cpu(kgem, bo);
6970813957e3Ssnj}
697103b705cfSriastradh
6972813957e3Ssnjvoid *kgem_bo_map__debug(struct kgem *kgem, struct kgem_bo *bo)
6973813957e3Ssnj{
6974813957e3Ssnj	void *ptr;
697503b705cfSriastradh
6976813957e3Ssnj	if (bo->tiling == I915_TILING_NONE && kgem->has_llc) {
6977813957e3Ssnj		ptr = MAP(bo->map__cpu);
6978813957e3Ssnj		if (ptr == NULL)
6979813957e3Ssnj			ptr = __kgem_bo_map__cpu(kgem, bo);
6980813957e3Ssnj	} else if (bo->tiling || !kgem->has_wc_mmap) {
6981813957e3Ssnj		ptr = bo->map__gtt;
6982813957e3Ssnj		if (ptr == NULL)
6983813957e3Ssnj			ptr = __kgem_bo_map__gtt(kgem, bo);
6984813957e3Ssnj	} else {
6985813957e3Ssnj		ptr = bo->map__wc;
6986813957e3Ssnj		if (ptr == NULL)
6987813957e3Ssnj			ptr = __kgem_bo_map__wc(kgem, bo);
698803b705cfSriastradh	}
698903b705cfSriastradh
6990813957e3Ssnj	return ptr;
699103b705cfSriastradh}
699203b705cfSriastradh
6993813957e3Ssnj
699403b705cfSriastradhuint32_t kgem_bo_flink(struct kgem *kgem, struct kgem_bo *bo)
699503b705cfSriastradh{
699603b705cfSriastradh	struct drm_gem_flink flink;
699703b705cfSriastradh
699863ef14f0Smrg	assert(kgem_bo_is_fenced(kgem, bo));
699963ef14f0Smrg
700003b705cfSriastradh	VG_CLEAR(flink);
700103b705cfSriastradh	flink.handle = bo->handle;
70029a906b70Schristos	if (do_ioctl(kgem->fd, DRM_IOCTL_GEM_FLINK, &flink))
700303b705cfSriastradh		return 0;
700403b705cfSriastradh
700503b705cfSriastradh	DBG(("%s: flinked handle=%d to name=%d, marking non-reusable\n",
700603b705cfSriastradh	     __FUNCTION__, flink.handle, flink.name));
700703b705cfSriastradh
700803b705cfSriastradh	/* Ordinarily giving the name aware makes the buffer non-reusable.
700903b705cfSriastradh	 * However, we track the lifetime of all clients and their hold
701003b705cfSriastradh	 * on the buffer, and *presuming* they do not pass it on to a third
701103b705cfSriastradh	 * party, we track the lifetime accurately.
701203b705cfSriastradh	 */
701303b705cfSriastradh	bo->reusable = false;
701403b705cfSriastradh	kgem_bo_unclean(kgem, bo);
701503b705cfSriastradh
701603b705cfSriastradh	return flink.name;
701703b705cfSriastradh}
701803b705cfSriastradh
701903b705cfSriastradhstruct kgem_bo *kgem_create_map(struct kgem *kgem,
702003b705cfSriastradh				void *ptr, uint32_t size,
702103b705cfSriastradh				bool read_only)
702203b705cfSriastradh{
702303b705cfSriastradh	struct kgem_bo *bo;
702403b705cfSriastradh	uintptr_t first_page, last_page;
702503b705cfSriastradh	uint32_t handle;
702603b705cfSriastradh
702703b705cfSriastradh	assert(MAP(ptr) == ptr);
702803b705cfSriastradh
70299a906b70Schristos	DBG(("%s(%p size=%d, read-only?=%d) - has_userptr?=%d\n", __FUNCTION__,
70309a906b70Schristos	     ptr, size, read_only, kgem->has_userptr));
703103b705cfSriastradh	if (!kgem->has_userptr)
703203b705cfSriastradh		return NULL;
703303b705cfSriastradh
703403b705cfSriastradh	first_page = (uintptr_t)ptr;
703503b705cfSriastradh	last_page = first_page + size + PAGE_SIZE - 1;
703603b705cfSriastradh
703763ef14f0Smrg	first_page &= ~(uintptr_t)(PAGE_SIZE-1);
703863ef14f0Smrg	last_page &= ~(uintptr_t)(PAGE_SIZE-1);
703903b705cfSriastradh	assert(last_page > first_page);
704003b705cfSriastradh
704103b705cfSriastradh	handle = gem_userptr(kgem->fd,
704203b705cfSriastradh			     (void *)first_page, last_page-first_page,
704303b705cfSriastradh			     read_only);
70449a906b70Schristos	if (handle == 0) {
704563ef14f0Smrg		if (read_only && kgem->has_wc_mmap) {
704663ef14f0Smrg			struct drm_i915_gem_set_domain set_domain;
704763ef14f0Smrg
704863ef14f0Smrg			handle = gem_userptr(kgem->fd,
704963ef14f0Smrg					     (void *)first_page, last_page-first_page,
705063ef14f0Smrg					     false);
705163ef14f0Smrg
705263ef14f0Smrg			VG_CLEAR(set_domain);
705363ef14f0Smrg			set_domain.handle = handle;
705463ef14f0Smrg			set_domain.read_domains = I915_GEM_DOMAIN_GTT;
705563ef14f0Smrg			set_domain.write_domain = 0;
705663ef14f0Smrg			if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_DOMAIN, &set_domain)) {
705763ef14f0Smrg				gem_close(kgem->fd, handle);
705863ef14f0Smrg				handle = 0;
705963ef14f0Smrg			}
706063ef14f0Smrg		}
706163ef14f0Smrg		if (handle == 0) {
706263ef14f0Smrg			DBG(("%s: import failed, errno=%d\n", __FUNCTION__, errno));
706363ef14f0Smrg			return NULL;
706463ef14f0Smrg		}
70659a906b70Schristos	}
706603b705cfSriastradh
706703b705cfSriastradh	bo = __kgem_bo_alloc(handle, (last_page - first_page) / PAGE_SIZE);
706803b705cfSriastradh	if (bo == NULL) {
706903b705cfSriastradh		gem_close(kgem->fd, handle);
707003b705cfSriastradh		return NULL;
707103b705cfSriastradh	}
707203b705cfSriastradh
70739a906b70Schristos	bo->unique_id = kgem_get_unique_id(kgem);
707403b705cfSriastradh	bo->snoop = !kgem->has_llc;
707503b705cfSriastradh	debug_alloc__bo(kgem, bo);
707603b705cfSriastradh
707703b705cfSriastradh	if (first_page != (uintptr_t)ptr) {
707803b705cfSriastradh		struct kgem_bo *proxy;
707903b705cfSriastradh
708003b705cfSriastradh		proxy = kgem_create_proxy(kgem, bo,
708103b705cfSriastradh					  (uintptr_t)ptr - first_page, size);
708203b705cfSriastradh		kgem_bo_destroy(kgem, bo);
708303b705cfSriastradh		if (proxy == NULL)
708403b705cfSriastradh			return NULL;
708503b705cfSriastradh
708603b705cfSriastradh		bo = proxy;
708703b705cfSriastradh	}
708803b705cfSriastradh
70899a906b70Schristos	bo->map__cpu = MAKE_USER_MAP(ptr);
709003b705cfSriastradh
709103b705cfSriastradh	DBG(("%s(ptr=%p, size=%d, pages=%d, read_only=%d) => handle=%d (proxy? %d)\n",
709203b705cfSriastradh	     __FUNCTION__, ptr, size, NUM_PAGES(size), read_only, handle, bo->proxy != NULL));
709303b705cfSriastradh	return bo;
709403b705cfSriastradh}
709503b705cfSriastradh
709603b705cfSriastradhvoid kgem_bo_sync__cpu(struct kgem *kgem, struct kgem_bo *bo)
709703b705cfSriastradh{
709803b705cfSriastradh	DBG(("%s: handle=%d\n", __FUNCTION__, bo->handle));
709903b705cfSriastradh	assert(!bo->scanout);
71009a906b70Schristos	assert_tiling(kgem, bo);
71019a906b70Schristos
710203b705cfSriastradh	kgem_bo_submit(kgem, bo);
710303b705cfSriastradh
710403b705cfSriastradh	/* SHM pixmaps use proxies for subpage offsets */
710503b705cfSriastradh	assert(!bo->purged);
710603b705cfSriastradh	while (bo->proxy)
710703b705cfSriastradh		bo = bo->proxy;
710803b705cfSriastradh	assert(!bo->purged);
710903b705cfSriastradh
711003b705cfSriastradh	if (bo->domain != DOMAIN_CPU || FORCE_MMAP_SYNC & (1 << DOMAIN_CPU)) {
711103b705cfSriastradh		struct drm_i915_gem_set_domain set_domain;
711203b705cfSriastradh
711303b705cfSriastradh		DBG(("%s: SYNC: handle=%d, needs_flush? %d, domain? %d, busy? %d\n",
711403b705cfSriastradh		     __FUNCTION__, bo->handle,
711503b705cfSriastradh		     bo->needs_flush, bo->domain,
711603b705cfSriastradh		     __kgem_busy(kgem, bo->handle)));
711703b705cfSriastradh
711803b705cfSriastradh		VG_CLEAR(set_domain);
711903b705cfSriastradh		set_domain.handle = bo->handle;
712003b705cfSriastradh		set_domain.read_domains = I915_GEM_DOMAIN_CPU;
712103b705cfSriastradh		set_domain.write_domain = I915_GEM_DOMAIN_CPU;
712203b705cfSriastradh
71239a906b70Schristos		if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_DOMAIN, &set_domain)) {
71249a906b70Schristos			DBG(("%s: sync: GPU hang detected\n", __FUNCTION__));
71259a906b70Schristos			kgem_throttle(kgem);
712603b705cfSriastradh		}
712763ef14f0Smrg		bo->needs_flush = false;
71289a906b70Schristos		kgem_bo_retire(kgem, bo);
71299a906b70Schristos		bo->domain = DOMAIN_CPU;
713063ef14f0Smrg		bo->gtt_dirty = true;
713103b705cfSriastradh	}
713203b705cfSriastradh}
713303b705cfSriastradh
713403b705cfSriastradhvoid kgem_bo_sync__cpu_full(struct kgem *kgem, struct kgem_bo *bo, bool write)
713503b705cfSriastradh{
713603b705cfSriastradh	DBG(("%s: handle=%d\n", __FUNCTION__, bo->handle));
713703b705cfSriastradh	assert(!bo->scanout || !write);
71389a906b70Schristos	assert_tiling(kgem, bo);
713903b705cfSriastradh
714003b705cfSriastradh	if (write || bo->needs_flush)
714103b705cfSriastradh		kgem_bo_submit(kgem, bo);
714203b705cfSriastradh
714303b705cfSriastradh	/* SHM pixmaps use proxies for subpage offsets */
714403b705cfSriastradh	assert(!bo->purged);
714503b705cfSriastradh	assert(bo->refcnt);
714603b705cfSriastradh	while (bo->proxy)
714703b705cfSriastradh		bo = bo->proxy;
714803b705cfSriastradh	assert(bo->refcnt);
714903b705cfSriastradh	assert(!bo->purged);
715003b705cfSriastradh
715163ef14f0Smrg	if (bo->rq == NULL && (kgem->has_llc || bo->snoop) && !write)
715263ef14f0Smrg		return;
715363ef14f0Smrg
715403b705cfSriastradh	if (bo->domain != DOMAIN_CPU || FORCE_MMAP_SYNC & (1 << DOMAIN_CPU)) {
715503b705cfSriastradh		struct drm_i915_gem_set_domain set_domain;
715603b705cfSriastradh
715703b705cfSriastradh		DBG(("%s: SYNC: handle=%d, needs_flush? %d, domain? %d, busy? %d\n",
715803b705cfSriastradh		     __FUNCTION__, bo->handle,
715903b705cfSriastradh		     bo->needs_flush, bo->domain,
716003b705cfSriastradh		     __kgem_busy(kgem, bo->handle)));
716103b705cfSriastradh
716203b705cfSriastradh		VG_CLEAR(set_domain);
716303b705cfSriastradh		set_domain.handle = bo->handle;
716403b705cfSriastradh		set_domain.read_domains = I915_GEM_DOMAIN_CPU;
716503b705cfSriastradh		set_domain.write_domain = write ? I915_GEM_DOMAIN_CPU : 0;
716603b705cfSriastradh
71679a906b70Schristos		if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_DOMAIN, &set_domain)) {
71689a906b70Schristos			DBG(("%s: sync: GPU hang detected\n", __FUNCTION__));
71699a906b70Schristos			kgem_throttle(kgem);
71709a906b70Schristos		}
717163ef14f0Smrg		bo->needs_flush = false;
71729a906b70Schristos		if (write) {
71739a906b70Schristos			kgem_bo_retire(kgem, bo);
71749a906b70Schristos			bo->domain = DOMAIN_CPU;
717563ef14f0Smrg			bo->gtt_dirty = true;
71769a906b70Schristos		} else {
717703b705cfSriastradh			if (bo->exec == NULL)
71789a906b70Schristos				kgem_bo_maybe_retire(kgem, bo);
71799a906b70Schristos			bo->domain = DOMAIN_NONE;
718003b705cfSriastradh		}
718103b705cfSriastradh	}
718203b705cfSriastradh}
718303b705cfSriastradh
718403b705cfSriastradhvoid kgem_bo_sync__gtt(struct kgem *kgem, struct kgem_bo *bo)
718503b705cfSriastradh{
718603b705cfSriastradh	DBG(("%s: handle=%d\n", __FUNCTION__, bo->handle));
718703b705cfSriastradh	assert(bo->refcnt);
718803b705cfSriastradh	assert(bo->proxy == NULL);
71899a906b70Schristos	assert_tiling(kgem, bo);
719063ef14f0Smrg	assert(!bo->snoop);
719103b705cfSriastradh
719203b705cfSriastradh	kgem_bo_submit(kgem, bo);
719303b705cfSriastradh
719463ef14f0Smrg	if (bo->domain != DOMAIN_GTT ||
719563ef14f0Smrg	    !kgem->has_coherent_mmap_gtt ||
719663ef14f0Smrg	    FORCE_MMAP_SYNC & (1 << DOMAIN_GTT)) {
719703b705cfSriastradh		struct drm_i915_gem_set_domain set_domain;
719803b705cfSriastradh
719903b705cfSriastradh		DBG(("%s: SYNC: handle=%d, needs_flush? %d, domain? %d, busy? %d\n",
720003b705cfSriastradh		     __FUNCTION__, bo->handle,
720103b705cfSriastradh		     bo->needs_flush, bo->domain,
720203b705cfSriastradh		     __kgem_busy(kgem, bo->handle)));
720303b705cfSriastradh
720403b705cfSriastradh		VG_CLEAR(set_domain);
720503b705cfSriastradh		set_domain.handle = bo->handle;
720603b705cfSriastradh		set_domain.read_domains = I915_GEM_DOMAIN_GTT;
720703b705cfSriastradh		set_domain.write_domain = I915_GEM_DOMAIN_GTT;
720803b705cfSriastradh
72099a906b70Schristos		if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_DOMAIN, &set_domain)) {
72109a906b70Schristos			DBG(("%s: sync: GPU hang detected\n", __FUNCTION__));
72119a906b70Schristos			kgem_throttle(kgem);
721203b705cfSriastradh		}
721363ef14f0Smrg		bo->needs_flush = false;
72149a906b70Schristos		kgem_bo_retire(kgem, bo);
72159a906b70Schristos		bo->domain = DOMAIN_GTT;
72169a906b70Schristos		bo->gtt_dirty = true;
721703b705cfSriastradh	}
721803b705cfSriastradh}
721903b705cfSriastradh
722003b705cfSriastradhvoid kgem_clear_dirty(struct kgem *kgem)
722103b705cfSriastradh{
722203b705cfSriastradh	struct list * const buffers = &kgem->next_request->buffers;
722303b705cfSriastradh	struct kgem_bo *bo;
722403b705cfSriastradh
722503b705cfSriastradh	list_for_each_entry(bo, buffers, request) {
722603b705cfSriastradh		if (!bo->gpu_dirty)
722703b705cfSriastradh			break;
722803b705cfSriastradh
722903b705cfSriastradh		bo->gpu_dirty = false;
723003b705cfSriastradh	}
723103b705cfSriastradh}
723203b705cfSriastradh
723303b705cfSriastradhstruct kgem_bo *kgem_create_proxy(struct kgem *kgem,
723403b705cfSriastradh				  struct kgem_bo *target,
723503b705cfSriastradh				  int offset, int length)
723603b705cfSriastradh{
723703b705cfSriastradh	struct kgem_bo *bo;
723803b705cfSriastradh
723903b705cfSriastradh	DBG(("%s: target handle=%d [proxy? %d], offset=%d, length=%d, io=%d\n",
724003b705cfSriastradh	     __FUNCTION__, target->handle, target->proxy ? target->proxy->delta : -1,
724103b705cfSriastradh	     offset, length, target->io));
724203b705cfSriastradh
724303b705cfSriastradh	bo = __kgem_bo_alloc(target->handle, length);
724403b705cfSriastradh	if (bo == NULL)
724503b705cfSriastradh		return NULL;
724603b705cfSriastradh
724703b705cfSriastradh	bo->unique_id = kgem_get_unique_id(kgem);
724803b705cfSriastradh	bo->reusable = false;
724903b705cfSriastradh	bo->size.bytes = length;
725003b705cfSriastradh
725103b705cfSriastradh	bo->io = target->io && target->proxy == NULL;
725203b705cfSriastradh	bo->gpu_dirty = target->gpu_dirty;
725303b705cfSriastradh	bo->tiling = target->tiling;
725403b705cfSriastradh	bo->pitch = target->pitch;
725503b705cfSriastradh	bo->flush = target->flush;
725603b705cfSriastradh	bo->snoop = target->snoop;
725703b705cfSriastradh
725803b705cfSriastradh	assert(!bo->scanout);
725903b705cfSriastradh	bo->proxy = kgem_bo_reference(target);
726003b705cfSriastradh	bo->delta = offset;
726103b705cfSriastradh
72629a906b70Schristos	/* Proxies are only tracked for busyness on the current rq */
72639a906b70Schristos	if (target->exec && !bo->io) {
72649a906b70Schristos		assert(RQ(target->rq) == kgem->next_request);
726503b705cfSriastradh		list_move_tail(&bo->request, &kgem->next_request->buffers);
726603b705cfSriastradh		bo->exec = &_kgem_dummy_exec;
72679a906b70Schristos		bo->rq = target->rq;
726803b705cfSriastradh	}
726903b705cfSriastradh
727003b705cfSriastradh	return bo;
727103b705cfSriastradh}
727203b705cfSriastradh
727303b705cfSriastradhstatic struct kgem_buffer *
727403b705cfSriastradhbuffer_alloc(void)
727503b705cfSriastradh{
727603b705cfSriastradh	struct kgem_buffer *bo;
727703b705cfSriastradh
727803b705cfSriastradh	bo = malloc(sizeof(*bo));
727903b705cfSriastradh	if (bo == NULL)
728003b705cfSriastradh		return NULL;
728103b705cfSriastradh
728203b705cfSriastradh	bo->mem = NULL;
728303b705cfSriastradh	bo->need_io = false;
72849a906b70Schristos	bo->mmapped = MMAPPED_CPU;
728503b705cfSriastradh
728603b705cfSriastradh	return bo;
728703b705cfSriastradh}
728803b705cfSriastradh
728903b705cfSriastradhstatic struct kgem_buffer *
729003b705cfSriastradhbuffer_alloc_with_data(int num_pages)
729103b705cfSriastradh{
729203b705cfSriastradh	struct kgem_buffer *bo;
729303b705cfSriastradh
729403b705cfSriastradh	bo = malloc(sizeof(*bo) + 2*UPLOAD_ALIGNMENT + num_pages * PAGE_SIZE);
729503b705cfSriastradh	if (bo == NULL)
729603b705cfSriastradh		return NULL;
729703b705cfSriastradh
729803b705cfSriastradh	bo->mem = (void *)ALIGN((uintptr_t)bo + sizeof(*bo), UPLOAD_ALIGNMENT);
729903b705cfSriastradh	bo->mmapped = false;
730003b705cfSriastradh	return bo;
730103b705cfSriastradh}
730203b705cfSriastradh
730303b705cfSriastradhstatic inline bool
730403b705cfSriastradhuse_snoopable_buffer(struct kgem *kgem, uint32_t flags)
730503b705cfSriastradh{
730603b705cfSriastradh	if ((flags & KGEM_BUFFER_WRITE) == 0)
730703b705cfSriastradh		return kgem->gen >= 030;
730803b705cfSriastradh
730903b705cfSriastradh	return true;
731003b705cfSriastradh}
731103b705cfSriastradh
731203b705cfSriastradhstatic void
731303b705cfSriastradhinit_buffer_from_bo(struct kgem_buffer *bo, struct kgem_bo *old)
731403b705cfSriastradh{
731503b705cfSriastradh	DBG(("%s: reusing handle=%d for buffer\n",
731603b705cfSriastradh	     __FUNCTION__, old->handle));
731703b705cfSriastradh
731803b705cfSriastradh	assert(old->proxy == NULL);
7319813957e3Ssnj	assert(list_is_empty(&old->list));
732003b705cfSriastradh
732103b705cfSriastradh	memcpy(&bo->base, old, sizeof(*old));
732203b705cfSriastradh	if (old->rq)
732303b705cfSriastradh		list_replace(&old->request, &bo->base.request);
732403b705cfSriastradh	else
732503b705cfSriastradh		list_init(&bo->base.request);
732603b705cfSriastradh	list_replace(&old->vma, &bo->base.vma);
732703b705cfSriastradh	list_init(&bo->base.list);
732803b705cfSriastradh	free(old);
732903b705cfSriastradh
733003b705cfSriastradh	assert(bo->base.tiling == I915_TILING_NONE);
733103b705cfSriastradh
733203b705cfSriastradh	bo->base.refcnt = 1;
733303b705cfSriastradh}
733403b705cfSriastradh
733503b705cfSriastradhstatic struct kgem_buffer *
733603b705cfSriastradhsearch_snoopable_buffer(struct kgem *kgem, unsigned alloc)
733703b705cfSriastradh{
733803b705cfSriastradh	struct kgem_buffer *bo;
733903b705cfSriastradh	struct kgem_bo *old;
734003b705cfSriastradh
734103b705cfSriastradh	old = search_snoop_cache(kgem, alloc, 0);
734203b705cfSriastradh	if (old) {
734303b705cfSriastradh		if (!old->io) {
734403b705cfSriastradh			bo = buffer_alloc();
734503b705cfSriastradh			if (bo == NULL)
734603b705cfSriastradh				return NULL;
734703b705cfSriastradh
734803b705cfSriastradh			init_buffer_from_bo(bo, old);
734903b705cfSriastradh		} else {
735003b705cfSriastradh			bo = (struct kgem_buffer *)old;
735103b705cfSriastradh			bo->base.refcnt = 1;
735203b705cfSriastradh		}
735303b705cfSriastradh
735403b705cfSriastradh		DBG(("%s: created CPU handle=%d for buffer, size %d\n",
735503b705cfSriastradh		     __FUNCTION__, bo->base.handle, num_pages(&bo->base)));
735603b705cfSriastradh
735703b705cfSriastradh		assert(bo->base.snoop);
735803b705cfSriastradh		assert(bo->base.tiling == I915_TILING_NONE);
735903b705cfSriastradh		assert(num_pages(&bo->base) >= alloc);
73609a906b70Schristos		assert(bo->mmapped == MMAPPED_CPU);
736103b705cfSriastradh		assert(bo->need_io == false);
736203b705cfSriastradh
736303b705cfSriastradh		bo->mem = kgem_bo_map__cpu(kgem, &bo->base);
736403b705cfSriastradh		if (bo->mem == NULL) {
736503b705cfSriastradh			bo->base.refcnt = 0;
736603b705cfSriastradh			kgem_bo_free(kgem, &bo->base);
736703b705cfSriastradh			bo = NULL;
736803b705cfSriastradh		}
736903b705cfSriastradh
737003b705cfSriastradh		return bo;
737103b705cfSriastradh	}
737203b705cfSriastradh
737303b705cfSriastradh	return NULL;
737403b705cfSriastradh}
737503b705cfSriastradh
737603b705cfSriastradhstatic struct kgem_buffer *
737703b705cfSriastradhcreate_snoopable_buffer(struct kgem *kgem, unsigned alloc)
737803b705cfSriastradh{
737903b705cfSriastradh	struct kgem_buffer *bo;
738003b705cfSriastradh	uint32_t handle;
738103b705cfSriastradh
738203b705cfSriastradh	if (kgem->has_llc) {
738303b705cfSriastradh		struct kgem_bo *old;
738403b705cfSriastradh
738503b705cfSriastradh		bo = buffer_alloc();
738603b705cfSriastradh		if (bo == NULL)
738703b705cfSriastradh			return NULL;
738803b705cfSriastradh
738903b705cfSriastradh		old = search_linear_cache(kgem, alloc,
739003b705cfSriastradh					 CREATE_INACTIVE | CREATE_CPU_MAP | CREATE_EXACT);
739103b705cfSriastradh		if (old) {
739203b705cfSriastradh			init_buffer_from_bo(bo, old);
739303b705cfSriastradh		} else {
739403b705cfSriastradh			handle = gem_create(kgem->fd, alloc);
739503b705cfSriastradh			if (handle == 0) {
739603b705cfSriastradh				free(bo);
739703b705cfSriastradh				return NULL;
739803b705cfSriastradh			}
739903b705cfSriastradh
740003b705cfSriastradh			__kgem_bo_init(&bo->base, handle, alloc);
74019a906b70Schristos			debug_alloc__bo(kgem, &bo->base);
740203b705cfSriastradh			DBG(("%s: created CPU (LLC) handle=%d for buffer, size %d\n",
740303b705cfSriastradh			     __FUNCTION__, bo->base.handle, alloc));
740403b705cfSriastradh		}
740503b705cfSriastradh
740603b705cfSriastradh		assert(bo->base.refcnt == 1);
74079a906b70Schristos		assert(bo->mmapped == MMAPPED_CPU);
740803b705cfSriastradh		assert(bo->need_io == false);
740903b705cfSriastradh
741003b705cfSriastradh		bo->mem = kgem_bo_map__cpu(kgem, &bo->base);
741103b705cfSriastradh		if (bo->mem != NULL)
741203b705cfSriastradh			return bo;
741303b705cfSriastradh
741403b705cfSriastradh		bo->base.refcnt = 0; /* for valgrind */
741503b705cfSriastradh		kgem_bo_free(kgem, &bo->base);
741603b705cfSriastradh	}
741703b705cfSriastradh
741803b705cfSriastradh	if (kgem->has_caching) {
741903b705cfSriastradh		struct kgem_bo *old;
742003b705cfSriastradh
742103b705cfSriastradh		bo = buffer_alloc();
742203b705cfSriastradh		if (bo == NULL)
742303b705cfSriastradh			return NULL;
742403b705cfSriastradh
742503b705cfSriastradh		old = search_linear_cache(kgem, alloc,
742603b705cfSriastradh					 CREATE_INACTIVE | CREATE_CPU_MAP | CREATE_EXACT);
742703b705cfSriastradh		if (old) {
742803b705cfSriastradh			init_buffer_from_bo(bo, old);
742903b705cfSriastradh		} else {
743003b705cfSriastradh			handle = gem_create(kgem->fd, alloc);
743103b705cfSriastradh			if (handle == 0) {
743203b705cfSriastradh				free(bo);
743303b705cfSriastradh				return NULL;
743403b705cfSriastradh			}
743503b705cfSriastradh
743603b705cfSriastradh			__kgem_bo_init(&bo->base, handle, alloc);
74379a906b70Schristos			debug_alloc__bo(kgem, &bo->base);
743803b705cfSriastradh			DBG(("%s: created CPU handle=%d for buffer, size %d\n",
743903b705cfSriastradh			     __FUNCTION__, bo->base.handle, alloc));
744003b705cfSriastradh		}
744103b705cfSriastradh
744203b705cfSriastradh		assert(bo->base.refcnt == 1);
74439a906b70Schristos		assert(bo->mmapped == MMAPPED_CPU);
744403b705cfSriastradh		assert(bo->need_io == false);
7445813957e3Ssnj		assert(!__kgem_busy(kgem, bo->base.handle));
744603b705cfSriastradh
744703b705cfSriastradh		if (!gem_set_caching(kgem->fd, bo->base.handle, SNOOPED))
744803b705cfSriastradh			goto free_caching;
744903b705cfSriastradh
745003b705cfSriastradh		bo->base.snoop = true;
745103b705cfSriastradh
745203b705cfSriastradh		bo->mem = kgem_bo_map__cpu(kgem, &bo->base);
745303b705cfSriastradh		if (bo->mem == NULL)
745403b705cfSriastradh			goto free_caching;
745503b705cfSriastradh
745603b705cfSriastradh		return bo;
745703b705cfSriastradh
745803b705cfSriastradhfree_caching:
745903b705cfSriastradh		bo->base.refcnt = 0; /* for valgrind */
746003b705cfSriastradh		kgem_bo_free(kgem, &bo->base);
746103b705cfSriastradh	}
746203b705cfSriastradh
746303b705cfSriastradh	if (kgem->has_userptr) {
746403b705cfSriastradh		bo = buffer_alloc();
746503b705cfSriastradh		if (bo == NULL)
746603b705cfSriastradh			return NULL;
746703b705cfSriastradh
746803b705cfSriastradh		//if (posix_memalign(&ptr, 64, ALIGN(size, 64)))
746903b705cfSriastradh		if (posix_memalign(&bo->mem, PAGE_SIZE, alloc * PAGE_SIZE)) {
747003b705cfSriastradh			free(bo);
747103b705cfSriastradh			return NULL;
747203b705cfSriastradh		}
747303b705cfSriastradh
747403b705cfSriastradh		handle = gem_userptr(kgem->fd, bo->mem, alloc * PAGE_SIZE, false);
747503b705cfSriastradh		if (handle == 0) {
747603b705cfSriastradh			free(bo->mem);
747703b705cfSriastradh			free(bo);
747803b705cfSriastradh			return NULL;
747903b705cfSriastradh		}
748003b705cfSriastradh
748103b705cfSriastradh		__kgem_bo_init(&bo->base, handle, alloc);
74829a906b70Schristos		debug_alloc__bo(kgem, &bo->base);
748303b705cfSriastradh		DBG(("%s: created snoop handle=%d for buffer\n",
748403b705cfSriastradh		     __FUNCTION__, bo->base.handle));
748503b705cfSriastradh
74869a906b70Schristos		assert(bo->mmapped == MMAPPED_CPU);
748703b705cfSriastradh		assert(bo->need_io == false);
748803b705cfSriastradh
748903b705cfSriastradh		bo->base.refcnt = 1;
749003b705cfSriastradh		bo->base.snoop = true;
74919a906b70Schristos		bo->base.map__cpu = MAKE_USER_MAP(bo->mem);
749203b705cfSriastradh
749303b705cfSriastradh		return bo;
749403b705cfSriastradh	}
749503b705cfSriastradh
749603b705cfSriastradh	return NULL;
749703b705cfSriastradh}
749803b705cfSriastradh
749903b705cfSriastradhstruct kgem_bo *kgem_create_buffer(struct kgem *kgem,
750003b705cfSriastradh				   uint32_t size, uint32_t flags,
750103b705cfSriastradh				   void **ret)
750203b705cfSriastradh{
750303b705cfSriastradh	struct kgem_buffer *bo;
750403b705cfSriastradh	unsigned offset, alloc;
750503b705cfSriastradh	struct kgem_bo *old;
750603b705cfSriastradh
750703b705cfSriastradh	DBG(("%s: size=%d, flags=%x [write?=%d, inplace?=%d, last?=%d]\n",
750803b705cfSriastradh	     __FUNCTION__, size, flags,
750903b705cfSriastradh	     !!(flags & KGEM_BUFFER_WRITE),
751003b705cfSriastradh	     !!(flags & KGEM_BUFFER_INPLACE),
751103b705cfSriastradh	     !!(flags & KGEM_BUFFER_LAST)));
751203b705cfSriastradh	assert(size);
751303b705cfSriastradh	/* we should never be asked to create anything TOO large */
751403b705cfSriastradh	assert(size <= kgem->max_object_size);
751503b705cfSriastradh
751603b705cfSriastradh#if !DBG_NO_UPLOAD_CACHE
751703b705cfSriastradh	list_for_each_entry(bo, &kgem->batch_buffers, base.list) {
751803b705cfSriastradh		assert(bo->base.io);
751903b705cfSriastradh		assert(bo->base.refcnt >= 1);
752003b705cfSriastradh
752103b705cfSriastradh		/* We can reuse any write buffer which we can fit */
752203b705cfSriastradh		if (flags == KGEM_BUFFER_LAST &&
752303b705cfSriastradh		    bo->write == KGEM_BUFFER_WRITE &&
75249a906b70Schristos		    bo->base.refcnt == 1 &&
75259a906b70Schristos		    bo->mmapped == MMAPPED_NONE &&
752603b705cfSriastradh		    size <= bytes(&bo->base)) {
752703b705cfSriastradh			DBG(("%s: reusing write buffer for read of %d bytes? used=%d, total=%d\n",
752803b705cfSriastradh			     __FUNCTION__, size, bo->used, bytes(&bo->base)));
75299a906b70Schristos			gem_write__cachealigned(kgem->fd, bo->base.handle,
75309a906b70Schristos						0, bo->used, bo->mem);
75319a906b70Schristos			assert(list_is_empty(&bo->base.vma));
753203b705cfSriastradh			bo->need_io = 0;
753303b705cfSriastradh			bo->write = 0;
753403b705cfSriastradh			offset = 0;
753503b705cfSriastradh			bo->used = size;
753603b705cfSriastradh			goto done;
753703b705cfSriastradh		}
753803b705cfSriastradh
753903b705cfSriastradh		if (flags & KGEM_BUFFER_WRITE) {
754003b705cfSriastradh			if ((bo->write & KGEM_BUFFER_WRITE) == 0 ||
754103b705cfSriastradh			    (((bo->write & ~flags) & KGEM_BUFFER_INPLACE) &&
754203b705cfSriastradh			     !bo->base.snoop)) {
754303b705cfSriastradh				DBG(("%s: skip write %x buffer, need %x\n",
754403b705cfSriastradh				     __FUNCTION__, bo->write, flags));
754503b705cfSriastradh				continue;
754603b705cfSriastradh			}
754703b705cfSriastradh			assert(bo->mmapped || bo->need_io);
754803b705cfSriastradh		} else {
754903b705cfSriastradh			if (bo->write & KGEM_BUFFER_WRITE) {
755003b705cfSriastradh				DBG(("%s: skip write %x buffer, need %x\n",
755103b705cfSriastradh				     __FUNCTION__, bo->write, flags));
755203b705cfSriastradh				continue;
755303b705cfSriastradh			}
755403b705cfSriastradh		}
755503b705cfSriastradh
755603b705cfSriastradh		if (bo->used + size <= bytes(&bo->base)) {
755703b705cfSriastradh			DBG(("%s: reusing buffer? used=%d + size=%d, total=%d\n",
755803b705cfSriastradh			     __FUNCTION__, bo->used, size, bytes(&bo->base)));
755903b705cfSriastradh			offset = bo->used;
756003b705cfSriastradh			bo->used += size;
756103b705cfSriastradh			goto done;
756203b705cfSriastradh		}
756303b705cfSriastradh	}
756403b705cfSriastradh
756503b705cfSriastradh	if (flags & KGEM_BUFFER_WRITE) {
756603b705cfSriastradh		list_for_each_entry(bo, &kgem->active_buffers, base.list) {
756703b705cfSriastradh			assert(bo->base.io);
756803b705cfSriastradh			assert(bo->base.refcnt >= 1);
75699a906b70Schristos			assert(bo->base.exec == NULL);
757003b705cfSriastradh			assert(bo->mmapped);
75719a906b70Schristos			assert(bo->mmapped == MMAPPED_GTT || kgem->has_llc || bo->base.snoop);
757203b705cfSriastradh
75739a906b70Schristos			if ((bo->write & ~flags) & KGEM_BUFFER_INPLACE && !bo->base.snoop) {
757403b705cfSriastradh				DBG(("%s: skip write %x buffer, need %x\n",
757503b705cfSriastradh				     __FUNCTION__, bo->write, flags));
757603b705cfSriastradh				continue;
757703b705cfSriastradh			}
757803b705cfSriastradh
757903b705cfSriastradh			if (bo->used + size <= bytes(&bo->base)) {
758003b705cfSriastradh				DBG(("%s: reusing buffer? used=%d + size=%d, total=%d\n",
758103b705cfSriastradh				     __FUNCTION__, bo->used, size, bytes(&bo->base)));
758203b705cfSriastradh				offset = bo->used;
758303b705cfSriastradh				bo->used += size;
758403b705cfSriastradh				list_move(&bo->base.list, &kgem->batch_buffers);
758503b705cfSriastradh				goto done;
758603b705cfSriastradh			}
75879a906b70Schristos
75889a906b70Schristos			if (bo->base.refcnt == 1 &&
75899a906b70Schristos			    size <= bytes(&bo->base) &&
75909a906b70Schristos			    (bo->base.rq == NULL ||
75919a906b70Schristos			     !__kgem_busy(kgem, bo->base.handle))) {
75929a906b70Schristos				DBG(("%s: reusing whole buffer? size=%d, total=%d\n",
75939a906b70Schristos				     __FUNCTION__, size, bytes(&bo->base)));
75949a906b70Schristos				__kgem_bo_clear_busy(&bo->base);
75959a906b70Schristos				assert(list_is_empty(&bo->base.vma));
75969a906b70Schristos
75979a906b70Schristos				switch (bo->mmapped) {
75989a906b70Schristos				case MMAPPED_CPU:
75999a906b70Schristos					kgem_bo_sync__cpu(kgem, &bo->base);
76009a906b70Schristos					break;
76019a906b70Schristos				case MMAPPED_GTT:
76029a906b70Schristos					kgem_bo_sync__gtt(kgem, &bo->base);
76039a906b70Schristos					break;
76049a906b70Schristos				}
76059a906b70Schristos
76069a906b70Schristos				offset = 0;
76079a906b70Schristos				bo->used = size;
76089a906b70Schristos				list_move(&bo->base.list, &kgem->batch_buffers);
76099a906b70Schristos				goto done;
76109a906b70Schristos			}
761103b705cfSriastradh		}
761203b705cfSriastradh	}
761303b705cfSriastradh#endif
761403b705cfSriastradh
761503b705cfSriastradh#if !DBG_NO_MAP_UPLOAD
761603b705cfSriastradh	/* Be a little more generous and hope to hold fewer mmappings */
761703b705cfSriastradh	alloc = ALIGN(2*size, kgem->buffer_size);
761803b705cfSriastradh	if (alloc > MAX_CACHE_SIZE)
761903b705cfSriastradh		alloc = ALIGN(size, kgem->buffer_size);
762003b705cfSriastradh	if (alloc > MAX_CACHE_SIZE)
762103b705cfSriastradh		alloc = PAGE_ALIGN(size);
762203b705cfSriastradh	assert(alloc);
762303b705cfSriastradh
76249a906b70Schristos	alloc /= PAGE_SIZE;
7625813957e3Ssnj	if (alloc > kgem->aperture_mappable / 4 && !kgem->has_wc_mmap)
762603b705cfSriastradh		flags &= ~KGEM_BUFFER_INPLACE;
762703b705cfSriastradh
762803b705cfSriastradh	if (kgem->has_llc &&
762903b705cfSriastradh	    (flags & KGEM_BUFFER_WRITE_INPLACE) != KGEM_BUFFER_WRITE_INPLACE) {
763003b705cfSriastradh		bo = buffer_alloc();
763103b705cfSriastradh		if (bo == NULL)
763203b705cfSriastradh			goto skip_llc;
763303b705cfSriastradh
763403b705cfSriastradh		old = NULL;
763503b705cfSriastradh		if ((flags & KGEM_BUFFER_WRITE) == 0)
763603b705cfSriastradh			old = search_linear_cache(kgem, alloc, CREATE_CPU_MAP);
763703b705cfSriastradh		if (old == NULL)
763803b705cfSriastradh			old = search_linear_cache(kgem, alloc, CREATE_INACTIVE | CREATE_CPU_MAP);
763903b705cfSriastradh		if (old == NULL)
764003b705cfSriastradh			old = search_linear_cache(kgem, NUM_PAGES(size), CREATE_INACTIVE | CREATE_CPU_MAP);
764103b705cfSriastradh		if (old) {
764203b705cfSriastradh			DBG(("%s: found LLC handle=%d for buffer\n",
764303b705cfSriastradh			     __FUNCTION__, old->handle));
764403b705cfSriastradh
764503b705cfSriastradh			init_buffer_from_bo(bo, old);
764603b705cfSriastradh		} else {
764703b705cfSriastradh			uint32_t handle = gem_create(kgem->fd, alloc);
764803b705cfSriastradh			if (handle == 0) {
764903b705cfSriastradh				free(bo);
765003b705cfSriastradh				goto skip_llc;
765103b705cfSriastradh			}
765203b705cfSriastradh			__kgem_bo_init(&bo->base, handle, alloc);
76539a906b70Schristos			debug_alloc__bo(kgem, &bo->base);
765403b705cfSriastradh			DBG(("%s: created LLC handle=%d for buffer\n",
765503b705cfSriastradh			     __FUNCTION__, bo->base.handle));
765603b705cfSriastradh		}
765703b705cfSriastradh
765803b705cfSriastradh		assert(bo->mmapped);
765903b705cfSriastradh		assert(!bo->need_io);
766003b705cfSriastradh
766103b705cfSriastradh		bo->mem = kgem_bo_map__cpu(kgem, &bo->base);
766203b705cfSriastradh		if (bo->mem) {
766303b705cfSriastradh			if (flags & KGEM_BUFFER_WRITE)
766403b705cfSriastradh				kgem_bo_sync__cpu(kgem, &bo->base);
766503b705cfSriastradh			flags &= ~KGEM_BUFFER_INPLACE;
766603b705cfSriastradh			goto init;
766703b705cfSriastradh		} else {
766803b705cfSriastradh			bo->base.refcnt = 0; /* for valgrind */
766903b705cfSriastradh			kgem_bo_free(kgem, &bo->base);
767003b705cfSriastradh		}
767103b705cfSriastradh	}
767203b705cfSriastradhskip_llc:
767303b705cfSriastradh
767403b705cfSriastradh	if ((flags & KGEM_BUFFER_WRITE_INPLACE) == KGEM_BUFFER_WRITE_INPLACE) {
767503b705cfSriastradh		/* The issue with using a GTT upload buffer is that we may
767603b705cfSriastradh		 * cause eviction-stalls in order to free up some GTT space.
767703b705cfSriastradh		 * An is-mappable? ioctl could help us detect when we are
767803b705cfSriastradh		 * about to block, or some per-page magic in the kernel.
767903b705cfSriastradh		 *
768003b705cfSriastradh		 * XXX This is especially noticeable on memory constrained
768103b705cfSriastradh		 * devices like gen2 or with relatively slow gpu like i3.
768203b705cfSriastradh		 */
768303b705cfSriastradh		DBG(("%s: searching for an inactive GTT map for upload\n",
768403b705cfSriastradh		     __FUNCTION__));
768503b705cfSriastradh		old = search_linear_cache(kgem, alloc,
768603b705cfSriastradh					  CREATE_EXACT | CREATE_INACTIVE | CREATE_GTT_MAP);
768703b705cfSriastradh#if HAVE_I915_GEM_BUFFER_INFO
768803b705cfSriastradh		if (old) {
768903b705cfSriastradh			struct drm_i915_gem_buffer_info info;
769003b705cfSriastradh
769103b705cfSriastradh			/* An example of such a non-blocking ioctl might work */
769203b705cfSriastradh
769303b705cfSriastradh			VG_CLEAR(info);
769403b705cfSriastradh			info.handle = handle;
76959a906b70Schristos			if (do_ioctl(kgem->fd,
769603b705cfSriastradh				     DRM_IOCTL_I915_GEM_BUFFER_INFO,
769703b705cfSriastradh				     &fino) == 0) {
769803b705cfSriastradh				old->presumed_offset = info.addr;
769903b705cfSriastradh				if ((info.flags & I915_GEM_MAPPABLE) == 0) {
770003b705cfSriastradh					kgem_bo_move_to_inactive(kgem, old);
770103b705cfSriastradh					old = NULL;
770203b705cfSriastradh				}
770303b705cfSriastradh			}
770403b705cfSriastradh		}
770503b705cfSriastradh#endif
770603b705cfSriastradh		if (old == NULL)
770703b705cfSriastradh			old = search_linear_cache(kgem, NUM_PAGES(size),
770803b705cfSriastradh						  CREATE_EXACT | CREATE_INACTIVE | CREATE_GTT_MAP);
770903b705cfSriastradh		if (old == NULL) {
771003b705cfSriastradh			old = search_linear_cache(kgem, alloc, CREATE_INACTIVE);
77119a906b70Schristos			if (old && !kgem_bo_can_map(kgem, old)) {
771203b705cfSriastradh				_kgem_bo_destroy(kgem, old);
771303b705cfSriastradh				old = NULL;
771403b705cfSriastradh			}
771503b705cfSriastradh		}
771603b705cfSriastradh		if (old) {
771703b705cfSriastradh			DBG(("%s: reusing handle=%d for buffer\n",
771803b705cfSriastradh			     __FUNCTION__, old->handle));
77199a906b70Schristos			assert(kgem_bo_can_map(kgem, old));
772003b705cfSriastradh			assert(!old->snoop);
772103b705cfSriastradh			assert(old->rq == NULL);
772203b705cfSriastradh
772303b705cfSriastradh			bo = buffer_alloc();
772403b705cfSriastradh			if (bo == NULL)
772503b705cfSriastradh				return NULL;
772603b705cfSriastradh
772703b705cfSriastradh			init_buffer_from_bo(bo, old);
772803b705cfSriastradh			assert(num_pages(&bo->base) >= NUM_PAGES(size));
772903b705cfSriastradh
773003b705cfSriastradh			assert(bo->mmapped);
773103b705cfSriastradh			assert(bo->base.refcnt == 1);
773203b705cfSriastradh
773303b705cfSriastradh			bo->mem = kgem_bo_map(kgem, &bo->base);
773403b705cfSriastradh			if (bo->mem) {
77359a906b70Schristos				if (bo->mem == MAP(bo->base.map__cpu))
773603b705cfSriastradh					flags &= ~KGEM_BUFFER_INPLACE;
77379a906b70Schristos				else
77389a906b70Schristos					bo->mmapped = MMAPPED_GTT;
773903b705cfSriastradh				goto init;
774003b705cfSriastradh			} else {
774103b705cfSriastradh				bo->base.refcnt = 0;
774203b705cfSriastradh				kgem_bo_free(kgem, &bo->base);
774303b705cfSriastradh			}
774403b705cfSriastradh		}
774503b705cfSriastradh	}
774603b705cfSriastradh#else
774703b705cfSriastradh	flags &= ~KGEM_BUFFER_INPLACE;
774803b705cfSriastradh#endif
774903b705cfSriastradh	/* Be more parsimonious with pwrite/pread/cacheable buffers */
775003b705cfSriastradh	if ((flags & KGEM_BUFFER_INPLACE) == 0)
775103b705cfSriastradh		alloc = NUM_PAGES(size);
775203b705cfSriastradh
775303b705cfSriastradh	if (use_snoopable_buffer(kgem, flags)) {
775403b705cfSriastradh		bo = search_snoopable_buffer(kgem, alloc);
775503b705cfSriastradh		if (bo) {
775603b705cfSriastradh			if (flags & KGEM_BUFFER_WRITE)
775703b705cfSriastradh				kgem_bo_sync__cpu(kgem, &bo->base);
775803b705cfSriastradh			flags &= ~KGEM_BUFFER_INPLACE;
775903b705cfSriastradh			goto init;
776003b705cfSriastradh		}
776103b705cfSriastradh
776203b705cfSriastradh		if ((flags & KGEM_BUFFER_INPLACE) == 0) {
776303b705cfSriastradh			bo = create_snoopable_buffer(kgem, alloc);
776403b705cfSriastradh			if (bo)
776503b705cfSriastradh				goto init;
776603b705cfSriastradh		}
776703b705cfSriastradh	}
776803b705cfSriastradh
776903b705cfSriastradh	flags &= ~KGEM_BUFFER_INPLACE;
777003b705cfSriastradh
777103b705cfSriastradh	old = NULL;
777203b705cfSriastradh	if ((flags & KGEM_BUFFER_WRITE) == 0)
777303b705cfSriastradh		old = search_linear_cache(kgem, alloc, 0);
777403b705cfSriastradh	if (old == NULL)
777503b705cfSriastradh		old = search_linear_cache(kgem, alloc, CREATE_INACTIVE);
777603b705cfSriastradh	if (old) {
777703b705cfSriastradh		DBG(("%s: reusing ordinary handle %d for io\n",
777803b705cfSriastradh		     __FUNCTION__, old->handle));
777903b705cfSriastradh		bo = buffer_alloc_with_data(num_pages(old));
778003b705cfSriastradh		if (bo == NULL)
778103b705cfSriastradh			return NULL;
778203b705cfSriastradh
778303b705cfSriastradh		init_buffer_from_bo(bo, old);
778403b705cfSriastradh		bo->need_io = flags & KGEM_BUFFER_WRITE;
778503b705cfSriastradh	} else {
778603b705cfSriastradh		unsigned hint;
778703b705cfSriastradh
778803b705cfSriastradh		if (use_snoopable_buffer(kgem, flags)) {
778903b705cfSriastradh			bo = create_snoopable_buffer(kgem, alloc);
779003b705cfSriastradh			if (bo)
779103b705cfSriastradh				goto init;
779203b705cfSriastradh		}
779303b705cfSriastradh
779403b705cfSriastradh		bo = buffer_alloc();
779503b705cfSriastradh		if (bo == NULL)
779603b705cfSriastradh			return NULL;
779703b705cfSriastradh
779803b705cfSriastradh		hint = CREATE_INACTIVE;
779903b705cfSriastradh		if (flags & KGEM_BUFFER_WRITE)
780003b705cfSriastradh			hint |= CREATE_CPU_MAP;
780103b705cfSriastradh		old = search_linear_cache(kgem, alloc, hint);
780203b705cfSriastradh		if (old) {
780303b705cfSriastradh			DBG(("%s: reusing handle=%d for buffer\n",
780403b705cfSriastradh			     __FUNCTION__, old->handle));
780503b705cfSriastradh
780603b705cfSriastradh			init_buffer_from_bo(bo, old);
780703b705cfSriastradh		} else {
780803b705cfSriastradh			uint32_t handle = gem_create(kgem->fd, alloc);
780903b705cfSriastradh			if (handle == 0) {
781003b705cfSriastradh				free(bo);
781103b705cfSriastradh				return NULL;
781203b705cfSriastradh			}
781303b705cfSriastradh
781403b705cfSriastradh			DBG(("%s: created handle=%d for buffer\n",
781503b705cfSriastradh			     __FUNCTION__, handle));
781603b705cfSriastradh
781703b705cfSriastradh			__kgem_bo_init(&bo->base, handle, alloc);
78189a906b70Schristos			debug_alloc__bo(kgem, &bo->base);
781903b705cfSriastradh		}
782003b705cfSriastradh
782103b705cfSriastradh		assert(bo->mmapped);
782203b705cfSriastradh		assert(!bo->need_io);
782303b705cfSriastradh		assert(bo->base.refcnt == 1);
782403b705cfSriastradh
782503b705cfSriastradh		if (flags & KGEM_BUFFER_WRITE) {
782603b705cfSriastradh			bo->mem = kgem_bo_map__cpu(kgem, &bo->base);
782703b705cfSriastradh			if (bo->mem != NULL) {
782803b705cfSriastradh				kgem_bo_sync__cpu(kgem, &bo->base);
782903b705cfSriastradh				goto init;
783003b705cfSriastradh			}
783103b705cfSriastradh		}
783203b705cfSriastradh
783303b705cfSriastradh		DBG(("%s: failing back to new pwrite buffer\n", __FUNCTION__));
783403b705cfSriastradh		old = &bo->base;
783503b705cfSriastradh		bo = buffer_alloc_with_data(num_pages(old));
783603b705cfSriastradh		if (bo == NULL) {
783703b705cfSriastradh			old->refcnt= 0;
783803b705cfSriastradh			kgem_bo_free(kgem, old);
783903b705cfSriastradh			return NULL;
784003b705cfSriastradh		}
784103b705cfSriastradh
784203b705cfSriastradh		init_buffer_from_bo(bo, old);
784303b705cfSriastradh
784403b705cfSriastradh		assert(bo->mem);
784503b705cfSriastradh		assert(!bo->mmapped);
784603b705cfSriastradh		assert(bo->base.refcnt == 1);
784703b705cfSriastradh
784803b705cfSriastradh		bo->need_io = flags & KGEM_BUFFER_WRITE;
784903b705cfSriastradh	}
785003b705cfSriastradhinit:
785103b705cfSriastradh	bo->base.io = true;
785203b705cfSriastradh	assert(bo->base.refcnt == 1);
785303b705cfSriastradh	assert(num_pages(&bo->base) >= NUM_PAGES(size));
785403b705cfSriastradh	assert(!bo->need_io || !bo->base.needs_flush);
785503b705cfSriastradh	assert(!bo->need_io || bo->base.domain != DOMAIN_GPU);
785603b705cfSriastradh	assert(bo->mem);
7857813957e3Ssnj	assert(bo->mmapped != MMAPPED_GTT || bo->base.map__gtt == bo->mem || bo->base.map__wc == bo->mem);
78589a906b70Schristos	assert(bo->mmapped != MMAPPED_CPU || MAP(bo->base.map__cpu) == bo->mem);
785903b705cfSriastradh
786003b705cfSriastradh	bo->used = size;
786103b705cfSriastradh	bo->write = flags & KGEM_BUFFER_WRITE_INPLACE;
786203b705cfSriastradh	offset = 0;
786303b705cfSriastradh
786403b705cfSriastradh	assert(list_is_empty(&bo->base.list));
786503b705cfSriastradh	list_add(&bo->base.list, &kgem->batch_buffers);
786603b705cfSriastradh
786703b705cfSriastradh	DBG(("%s(pages=%d [%d]) new handle=%d, used=%d, write=%d\n",
786803b705cfSriastradh	     __FUNCTION__, num_pages(&bo->base), alloc, bo->base.handle, bo->used, bo->write));
786903b705cfSriastradh
787003b705cfSriastradhdone:
787103b705cfSriastradh	bo->used = ALIGN(bo->used, UPLOAD_ALIGNMENT);
78729a906b70Schristos	assert(bo->used && bo->used <= bytes(&bo->base));
787303b705cfSriastradh	assert(bo->mem);
787403b705cfSriastradh	*ret = (char *)bo->mem + offset;
787503b705cfSriastradh	return kgem_create_proxy(kgem, &bo->base, offset, size);
787603b705cfSriastradh}
787703b705cfSriastradh
787803b705cfSriastradhbool kgem_buffer_is_inplace(struct kgem_bo *_bo)
787903b705cfSriastradh{
788003b705cfSriastradh	struct kgem_buffer *bo = (struct kgem_buffer *)_bo->proxy;
788103b705cfSriastradh	return bo->write & KGEM_BUFFER_WRITE_INPLACE;
788203b705cfSriastradh}
788303b705cfSriastradh
788403b705cfSriastradhstruct kgem_bo *kgem_create_buffer_2d(struct kgem *kgem,
788503b705cfSriastradh				      int width, int height, int bpp,
788603b705cfSriastradh				      uint32_t flags,
788703b705cfSriastradh				      void **ret)
788803b705cfSriastradh{
788903b705cfSriastradh	struct kgem_bo *bo;
789003b705cfSriastradh	int stride;
789103b705cfSriastradh
789203b705cfSriastradh	assert(width > 0 && height > 0);
789303b705cfSriastradh	assert(ret != NULL);
789403b705cfSriastradh	stride = ALIGN(width, 2) * bpp >> 3;
7895813957e3Ssnj	stride = ALIGN(stride, kgem->gen >= 0100 ? 32 : 4);
789603b705cfSriastradh
789703b705cfSriastradh	DBG(("%s: %dx%d, %d bpp, stride=%d\n",
789803b705cfSriastradh	     __FUNCTION__, width, height, bpp, stride));
789903b705cfSriastradh
790003b705cfSriastradh	bo = kgem_create_buffer(kgem, stride * ALIGN(height, 2), flags, ret);
790103b705cfSriastradh	if (bo == NULL) {
790203b705cfSriastradh		DBG(("%s: allocation failure for upload buffer\n",
790303b705cfSriastradh		     __FUNCTION__));
790403b705cfSriastradh		return NULL;
790503b705cfSriastradh	}
790603b705cfSriastradh	assert(*ret != NULL);
790703b705cfSriastradh	assert(bo->proxy != NULL);
790803b705cfSriastradh
790903b705cfSriastradh	if (height & 1) {
791003b705cfSriastradh		struct kgem_buffer *io = (struct kgem_buffer *)bo->proxy;
791103b705cfSriastradh		int min;
791203b705cfSriastradh
791303b705cfSriastradh		assert(io->used);
791403b705cfSriastradh
791503b705cfSriastradh		/* Having padded this surface to ensure that accesses to
791603b705cfSriastradh		 * the last pair of rows is valid, remove the padding so
791703b705cfSriastradh		 * that it can be allocated to other pixmaps.
791803b705cfSriastradh		 */
791903b705cfSriastradh		min = bo->delta + height * stride;
792003b705cfSriastradh		min = ALIGN(min, UPLOAD_ALIGNMENT);
792103b705cfSriastradh		if (io->used != min) {
792203b705cfSriastradh			DBG(("%s: trimming buffer from %d to %d\n",
792303b705cfSriastradh			     __FUNCTION__, io->used, min));
792403b705cfSriastradh			io->used = min;
792503b705cfSriastradh		}
792603b705cfSriastradh		bo->size.bytes -= stride;
792703b705cfSriastradh	}
792803b705cfSriastradh
79299a906b70Schristos	bo->map__cpu = *ret;
793003b705cfSriastradh	bo->pitch = stride;
793103b705cfSriastradh	bo->unique_id = kgem_get_unique_id(kgem);
793203b705cfSriastradh	return bo;
793303b705cfSriastradh}
793403b705cfSriastradh
793503b705cfSriastradhstruct kgem_bo *kgem_upload_source_image(struct kgem *kgem,
793603b705cfSriastradh					 const void *data,
793703b705cfSriastradh					 const BoxRec *box,
793803b705cfSriastradh					 int stride, int bpp)
793903b705cfSriastradh{
794003b705cfSriastradh	int width  = box->x2 - box->x1;
794103b705cfSriastradh	int height = box->y2 - box->y1;
794203b705cfSriastradh	struct kgem_bo *bo;
794303b705cfSriastradh	void *dst;
794403b705cfSriastradh
794503b705cfSriastradh	if (!kgem_can_create_2d(kgem, width, height, bpp))
794603b705cfSriastradh		return NULL;
794703b705cfSriastradh
794803b705cfSriastradh	DBG(("%s : (%d, %d), (%d, %d), stride=%d, bpp=%d\n",
794903b705cfSriastradh	     __FUNCTION__, box->x1, box->y1, box->x2, box->y2, stride, bpp));
795003b705cfSriastradh
795103b705cfSriastradh	assert(data);
795203b705cfSriastradh	assert(width > 0);
795303b705cfSriastradh	assert(height > 0);
795403b705cfSriastradh	assert(stride);
795503b705cfSriastradh	assert(bpp);
795603b705cfSriastradh
795703b705cfSriastradh	bo = kgem_create_buffer_2d(kgem,
795803b705cfSriastradh				   width, height, bpp,
795903b705cfSriastradh				   KGEM_BUFFER_WRITE_INPLACE, &dst);
79609a906b70Schristos	if (bo == NULL)
79619a906b70Schristos		return NULL;
79629a906b70Schristos
79639a906b70Schristos	if (sigtrap_get()) {
79649a906b70Schristos		kgem_bo_destroy(kgem, bo);
79659a906b70Schristos		return NULL;
79669a906b70Schristos	}
79679a906b70Schristos
79689a906b70Schristos	memcpy_blt(data, dst, bpp,
79699a906b70Schristos		   stride, bo->pitch,
79709a906b70Schristos		   box->x1, box->y1,
79719a906b70Schristos		   0, 0,
79729a906b70Schristos		   width, height);
797303b705cfSriastradh
79749a906b70Schristos	sigtrap_put();
797503b705cfSriastradh	return bo;
797603b705cfSriastradh}
797703b705cfSriastradh
797803b705cfSriastradhvoid kgem_proxy_bo_attach(struct kgem_bo *bo,
797903b705cfSriastradh			  struct kgem_bo **ptr)
798003b705cfSriastradh{
798103b705cfSriastradh	DBG(("%s: handle=%d\n", __FUNCTION__, bo->handle));
79829a906b70Schristos	assert(bo->map__gtt == NULL);
798303b705cfSriastradh	assert(bo->proxy);
798403b705cfSriastradh	list_add(&bo->vma, &bo->proxy->vma);
79859a906b70Schristos	bo->map__gtt = ptr;
798603b705cfSriastradh	*ptr = kgem_bo_reference(bo);
798703b705cfSriastradh}
798803b705cfSriastradh
798903b705cfSriastradhvoid kgem_buffer_read_sync(struct kgem *kgem, struct kgem_bo *_bo)
799003b705cfSriastradh{
799103b705cfSriastradh	struct kgem_buffer *bo;
799203b705cfSriastradh	uint32_t offset = _bo->delta, length = _bo->size.bytes;
799303b705cfSriastradh
799403b705cfSriastradh	/* We expect the caller to have already submitted the batch */
799503b705cfSriastradh	assert(_bo->io);
799603b705cfSriastradh	assert(_bo->exec == NULL);
799703b705cfSriastradh	assert(_bo->rq == NULL);
799803b705cfSriastradh	assert(_bo->proxy);
799903b705cfSriastradh
800003b705cfSriastradh	_bo = _bo->proxy;
800103b705cfSriastradh	assert(_bo->proxy == NULL);
800203b705cfSriastradh	assert(_bo->exec == NULL);
800303b705cfSriastradh
800403b705cfSriastradh	bo = (struct kgem_buffer *)_bo;
800503b705cfSriastradh
800603b705cfSriastradh	DBG(("%s(offset=%d, length=%d, snooped=%d)\n", __FUNCTION__,
800703b705cfSriastradh	     offset, length, bo->base.snoop));
800803b705cfSriastradh
800903b705cfSriastradh	if (bo->mmapped) {
801003b705cfSriastradh		struct drm_i915_gem_set_domain set_domain;
801103b705cfSriastradh
801203b705cfSriastradh		DBG(("%s: sync: needs_flush? %d, domain? %d, busy? %d\n",
801303b705cfSriastradh		     __FUNCTION__,
801403b705cfSriastradh		     bo->base.needs_flush,
801503b705cfSriastradh		     bo->base.domain,
801603b705cfSriastradh		     __kgem_busy(kgem, bo->base.handle)));
801703b705cfSriastradh
80189a906b70Schristos		assert(bo->mmapped == MMAPPED_GTT || bo->base.snoop || kgem->has_llc);
801903b705cfSriastradh
802003b705cfSriastradh		VG_CLEAR(set_domain);
802103b705cfSriastradh		set_domain.handle = bo->base.handle;
802203b705cfSriastradh		set_domain.write_domain = 0;
802303b705cfSriastradh		set_domain.read_domains =
80249a906b70Schristos			bo->mmapped == MMAPPED_CPU ? I915_GEM_DOMAIN_CPU : I915_GEM_DOMAIN_GTT;
802503b705cfSriastradh
80269a906b70Schristos		if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_DOMAIN, &set_domain)) {
80279a906b70Schristos			DBG(("%s: sync: GPU hang detected\n", __FUNCTION__));
80289a906b70Schristos			kgem_throttle(kgem);
80299a906b70Schristos		}
803003b705cfSriastradh	} else {
803103b705cfSriastradh		if (gem_read(kgem->fd,
803203b705cfSriastradh			     bo->base.handle, (char *)bo->mem+offset,
803303b705cfSriastradh			     offset, length))
803403b705cfSriastradh			return;
803503b705cfSriastradh	}
80369a906b70Schristos	kgem_bo_maybe_retire(kgem, &bo->base);
803703b705cfSriastradh	bo->base.domain = DOMAIN_NONE;
803803b705cfSriastradh}
803903b705cfSriastradh
804003b705cfSriastradhuint32_t kgem_bo_get_binding(struct kgem_bo *bo, uint32_t format)
804103b705cfSriastradh{
804203b705cfSriastradh	struct kgem_bo_binding *b;
804303b705cfSriastradh
80449a906b70Schristos	assert(bo->refcnt);
80459a906b70Schristos
804603b705cfSriastradh	for (b = &bo->binding; b && b->offset; b = b->next)
804703b705cfSriastradh		if (format == b->format)
804803b705cfSriastradh			return b->offset;
804903b705cfSriastradh
805003b705cfSriastradh	return 0;
805103b705cfSriastradh}
805203b705cfSriastradh
805303b705cfSriastradhvoid kgem_bo_set_binding(struct kgem_bo *bo, uint32_t format, uint16_t offset)
805403b705cfSriastradh{
805503b705cfSriastradh	struct kgem_bo_binding *b;
805603b705cfSriastradh
80579a906b70Schristos	assert(bo->refcnt);
80589a906b70Schristos
805903b705cfSriastradh	for (b = &bo->binding; b; b = b->next) {
806003b705cfSriastradh		if (b->offset)
806103b705cfSriastradh			continue;
806203b705cfSriastradh
806303b705cfSriastradh		b->offset = offset;
806403b705cfSriastradh		b->format = format;
806503b705cfSriastradh
806603b705cfSriastradh		if (b->next)
806703b705cfSriastradh			b->next->offset = 0;
806803b705cfSriastradh
806903b705cfSriastradh		return;
807003b705cfSriastradh	}
807103b705cfSriastradh
807203b705cfSriastradh	b = malloc(sizeof(*b));
807303b705cfSriastradh	if (b) {
807403b705cfSriastradh		b->next = bo->binding.next;
807503b705cfSriastradh		b->format = format;
807603b705cfSriastradh		b->offset = offset;
807703b705cfSriastradh		bo->binding.next = b;
807803b705cfSriastradh	}
807903b705cfSriastradh}
808003b705cfSriastradh
808103b705cfSriastradhstruct kgem_bo *
808203b705cfSriastradhkgem_replace_bo(struct kgem *kgem,
808303b705cfSriastradh		struct kgem_bo *src,
808403b705cfSriastradh		uint32_t width,
808503b705cfSriastradh		uint32_t height,
808603b705cfSriastradh		uint32_t pitch,
808703b705cfSriastradh		uint32_t bpp)
808803b705cfSriastradh{
808903b705cfSriastradh	struct kgem_bo *dst;
809003b705cfSriastradh	uint32_t br00, br13;
809103b705cfSriastradh	uint32_t handle;
809203b705cfSriastradh	uint32_t size;
809303b705cfSriastradh	uint32_t *b;
809403b705cfSriastradh
809503b705cfSriastradh	DBG(("%s: replacing bo handle=%d, size=%dx%d pitch=%d, with pitch=%d\n",
809603b705cfSriastradh	     __FUNCTION__, src->handle,  width, height, src->pitch, pitch));
809703b705cfSriastradh
809803b705cfSriastradh	/* We only expect to be called to fixup small buffers, hence why
809903b705cfSriastradh	 * we only attempt to allocate a linear bo.
810003b705cfSriastradh	 */
810103b705cfSriastradh	assert(src->tiling == I915_TILING_NONE);
81029a906b70Schristos	assert(kgem_bo_can_blt(kgem, src));
810303b705cfSriastradh
810403b705cfSriastradh	size = height * pitch;
810503b705cfSriastradh	size = NUM_PAGES(size);
810603b705cfSriastradh
810703b705cfSriastradh	dst = search_linear_cache(kgem, size, 0);
810803b705cfSriastradh	if (dst == NULL)
810903b705cfSriastradh		dst = search_linear_cache(kgem, size, CREATE_INACTIVE);
811003b705cfSriastradh	if (dst == NULL) {
811103b705cfSriastradh		handle = gem_create(kgem->fd, size);
811203b705cfSriastradh		if (handle == 0)
811303b705cfSriastradh			return NULL;
811403b705cfSriastradh
811503b705cfSriastradh		dst = __kgem_bo_alloc(handle, size);
811603b705cfSriastradh		if (dst == NULL) {
811703b705cfSriastradh			gem_close(kgem->fd, handle);
811803b705cfSriastradh			return NULL;
811903b705cfSriastradh		}
812003b705cfSriastradh
812103b705cfSriastradh		debug_alloc__bo(kgem, dst);
812203b705cfSriastradh	}
812303b705cfSriastradh	dst->pitch = pitch;
812403b705cfSriastradh	dst->unique_id = kgem_get_unique_id(kgem);
812503b705cfSriastradh	dst->refcnt = 1;
81269a906b70Schristos	assert(dst->tiling == I915_TILING_NONE);
81279a906b70Schristos	assert(kgem_bo_can_blt(kgem, dst));
812803b705cfSriastradh
812903b705cfSriastradh	kgem_set_mode(kgem, KGEM_BLT, dst);
81309a906b70Schristos	if (!kgem_check_batch(kgem, 10) ||
813103b705cfSriastradh	    !kgem_check_reloc(kgem, 2) ||
813203b705cfSriastradh	    !kgem_check_many_bo_fenced(kgem, src, dst, NULL)) {
813303b705cfSriastradh		kgem_submit(kgem);
813403b705cfSriastradh		if (!kgem_check_many_bo_fenced(kgem, src, dst, NULL)) {
813503b705cfSriastradh			kgem_bo_destroy(kgem, dst);
813603b705cfSriastradh			return NULL;
813703b705cfSriastradh		}
813803b705cfSriastradh		_kgem_set_mode(kgem, KGEM_BLT);
813903b705cfSriastradh	}
814063ef14f0Smrg	kgem_bcs_set_tiling(kgem, src, dst);
814103b705cfSriastradh
814203b705cfSriastradh	br00 = XY_SRC_COPY_BLT_CMD;
814303b705cfSriastradh	br13 = pitch;
814403b705cfSriastradh	pitch = src->pitch;
814503b705cfSriastradh	if (kgem->gen >= 040 && src->tiling) {
814603b705cfSriastradh		br00 |= BLT_SRC_TILED;
814703b705cfSriastradh		pitch >>= 2;
814803b705cfSriastradh	}
814903b705cfSriastradh
815003b705cfSriastradh	br13 |= 0xcc << 16;
815103b705cfSriastradh	switch (bpp) {
815203b705cfSriastradh	default:
815303b705cfSriastradh	case 32: br00 |= BLT_WRITE_ALPHA | BLT_WRITE_RGB;
815403b705cfSriastradh		 br13 |= 1 << 25; /* RGB8888 */
815503b705cfSriastradh	case 16: br13 |= 1 << 24; /* RGB565 */
815603b705cfSriastradh	case 8: break;
815703b705cfSriastradh	}
815803b705cfSriastradh
815903b705cfSriastradh	b = kgem->batch + kgem->nbatch;
81609a906b70Schristos	if (kgem->gen >= 0100) {
81619a906b70Schristos		b[0] = br00 | 8;
81629a906b70Schristos		b[1] = br13;
81639a906b70Schristos		b[2] = 0;
81649a906b70Schristos		b[3] = height << 16 | width;
81659a906b70Schristos		*(uint64_t *)(b+4) =
81669a906b70Schristos			kgem_add_reloc64(kgem, kgem->nbatch + 4, dst,
81679a906b70Schristos					 I915_GEM_DOMAIN_RENDER << 16 |
81689a906b70Schristos					 I915_GEM_DOMAIN_RENDER |
81699a906b70Schristos					 KGEM_RELOC_FENCED,
81709a906b70Schristos					 0);
81719a906b70Schristos		b[6] = 0;
81729a906b70Schristos		b[7] = pitch;
81739a906b70Schristos		*(uint64_t *)(b+8) =
81749a906b70Schristos			kgem_add_reloc64(kgem, kgem->nbatch + 8, src,
81759a906b70Schristos					 I915_GEM_DOMAIN_RENDER << 16 |
81769a906b70Schristos					 KGEM_RELOC_FENCED,
81779a906b70Schristos					 0);
81789a906b70Schristos		kgem->nbatch += 10;
81799a906b70Schristos	} else {
81809a906b70Schristos		b[0] = br00 | 6;
81819a906b70Schristos		b[1] = br13;
81829a906b70Schristos		b[2] = 0;
81839a906b70Schristos		b[3] = height << 16 | width;
81849a906b70Schristos		b[4] = kgem_add_reloc(kgem, kgem->nbatch + 4, dst,
81859a906b70Schristos				      I915_GEM_DOMAIN_RENDER << 16 |
81869a906b70Schristos				      I915_GEM_DOMAIN_RENDER |
81879a906b70Schristos				      KGEM_RELOC_FENCED,
81889a906b70Schristos				      0);
81899a906b70Schristos		b[5] = 0;
81909a906b70Schristos		b[6] = pitch;
81919a906b70Schristos		b[7] = kgem_add_reloc(kgem, kgem->nbatch + 7, src,
81929a906b70Schristos				      I915_GEM_DOMAIN_RENDER << 16 |
81939a906b70Schristos				      KGEM_RELOC_FENCED,
81949a906b70Schristos				      0);
81959a906b70Schristos		kgem->nbatch += 8;
81969a906b70Schristos	}
819703b705cfSriastradh
819803b705cfSriastradh	return dst;
819903b705cfSriastradh}
82009a906b70Schristos
82019a906b70Schristosbool kgem_bo_convert_to_gpu(struct kgem *kgem,
82029a906b70Schristos			    struct kgem_bo *bo,
82039a906b70Schristos			    unsigned flags)
82049a906b70Schristos{
8205813957e3Ssnj	DBG(("%s: converting handle=%d from CPU to GPU, flags=%x, busy?=%d\n",
8206813957e3Ssnj	     __FUNCTION__, bo->handle, flags, __kgem_bo_is_busy(kgem, bo)));
82079a906b70Schristos	assert(bo->tiling == I915_TILING_NONE);
82089a906b70Schristos
820963ef14f0Smrg	if (flags & (__MOVE_PRIME | __MOVE_SCANOUT))
821063ef14f0Smrg		return false;
821163ef14f0Smrg
82129a906b70Schristos	if (kgem->has_llc)
82139a906b70Schristos		return true;
82149a906b70Schristos
82159a906b70Schristos	if (flags & MOVE_ASYNC_HINT && __kgem_bo_is_busy(kgem, bo))
82169a906b70Schristos		return false;
82179a906b70Schristos
82189a906b70Schristos	assert(bo->snoop);
82199a906b70Schristos
82209a906b70Schristos	kgem_bo_submit(kgem, bo);
82219a906b70Schristos
82229a906b70Schristos	if (!gem_set_caching(kgem->fd, bo->handle, UNCACHED))
82239a906b70Schristos		return false;
82249a906b70Schristos
82259a906b70Schristos	bo->snoop = false;
82269a906b70Schristos	return true;
82279a906b70Schristos}
8228