103b705cfSriastradh/* 203b705cfSriastradh * Copyright (c) 2011 Intel Corporation 303b705cfSriastradh * 403b705cfSriastradh * Permission is hereby granted, free of charge, to any person obtaining a 503b705cfSriastradh * copy of this software and associated documentation files (the "Software"), 603b705cfSriastradh * to deal in the Software without restriction, including without limitation 703b705cfSriastradh * the rights to use, copy, modify, merge, publish, distribute, sublicense, 803b705cfSriastradh * and/or sell copies of the Software, and to permit persons to whom the 903b705cfSriastradh * Software is furnished to do so, subject to the following conditions: 1003b705cfSriastradh * 1103b705cfSriastradh * The above copyright notice and this permission notice (including the next 1203b705cfSriastradh * paragraph) shall be included in all copies or substantial portions of the 1303b705cfSriastradh * Software. 1403b705cfSriastradh * 1503b705cfSriastradh * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 1603b705cfSriastradh * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 1703b705cfSriastradh * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 1803b705cfSriastradh * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 1903b705cfSriastradh * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 2003b705cfSriastradh * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 2103b705cfSriastradh * SOFTWARE. 
2203b705cfSriastradh * 2303b705cfSriastradh * Authors: 2403b705cfSriastradh * Chris Wilson <chris@chris-wilson.co.uk> 2503b705cfSriastradh * 2603b705cfSriastradh */ 2703b705cfSriastradh 2803b705cfSriastradh#ifdef HAVE_CONFIG_H 2903b705cfSriastradh#include "config.h" 3003b705cfSriastradh#endif 3103b705cfSriastradh 3203b705cfSriastradh#include "sna.h" 3303b705cfSriastradh#include "sna_reg.h" 3403b705cfSriastradh 3503b705cfSriastradh#include <unistd.h> 3603b705cfSriastradh#include <sys/ioctl.h> 3703b705cfSriastradh#include <sys/mman.h> 389a906b70Schristos#include <sys/stat.h> 3903b705cfSriastradh#include <time.h> 409a906b70Schristos#include <sched.h> 4103b705cfSriastradh#include <errno.h> 4203b705cfSriastradh#include <fcntl.h> 4303b705cfSriastradh 4403b705cfSriastradh#include <xf86drm.h> 4503b705cfSriastradh 4603b705cfSriastradh#ifdef HAVE_VALGRIND 4703b705cfSriastradh#include <valgrind.h> 4803b705cfSriastradh#include <memcheck.h> 4903b705cfSriastradh#endif 5003b705cfSriastradh 5103b705cfSriastradh#ifdef HAVE_STRUCT_SYSINFO_TOTALRAM 5203b705cfSriastradh#include <sys/sysinfo.h> 5303b705cfSriastradh#endif 5403b705cfSriastradh 5503b705cfSriastradh#include "sna_cpuid.h" 5603b705cfSriastradh 5703b705cfSriastradhstatic struct kgem_bo * 5803b705cfSriastradhsearch_linear_cache(struct kgem *kgem, unsigned int num_pages, unsigned flags); 5903b705cfSriastradh 6003b705cfSriastradhstatic struct kgem_bo * 6103b705cfSriastradhsearch_snoop_cache(struct kgem *kgem, unsigned int num_pages, unsigned flags); 6203b705cfSriastradh 6303b705cfSriastradh#define DBG_NO_HW 0 649a906b70Schristos#define DBG_NO_EXEC 0 6503b705cfSriastradh#define DBG_NO_TILING 0 6603b705cfSriastradh#define DBG_NO_CACHE 0 679a906b70Schristos#define DBG_NO_SNOOP_CACHE 0 6803b705cfSriastradh#define DBG_NO_CACHE_LEVEL 0 6903b705cfSriastradh#define DBG_NO_CPU 0 7003b705cfSriastradh#define DBG_NO_CREATE2 0 7103b705cfSriastradh#define DBG_NO_USERPTR 0 7203b705cfSriastradh#define DBG_NO_UNSYNCHRONIZED_USERPTR 0 
#define DBG_NO_COHERENT_MMAP_GTT 0
#define DBG_NO_LLC 0
#define DBG_NO_SEMAPHORES 0
#define DBG_NO_MADV 0
#define DBG_NO_UPLOAD_CACHE 0
#define DBG_NO_UPLOAD_ACTIVE 0
#define DBG_NO_MAP_UPLOAD 0
#define DBG_NO_RELAXED_FENCING 0
#define DBG_NO_SECURE_BATCHES 0
#define DBG_NO_PINNED_BATCHES 0
#define DBG_NO_SHRINK_BATCHES 0
#define DBG_NO_FAST_RELOC 0
#define DBG_NO_HANDLE_LUT 0
#define DBG_NO_WT 0
#define DBG_NO_WC_MMAP 0
#define DBG_NO_BLT_Y 0
#define DBG_NO_SCANOUT_Y 0
#define DBG_NO_DIRTYFB 0
#define DBG_NO_DETILING 0
#define DBG_DUMP 0
#define DBG_NO_MALLOC_CACHE 0

#define FORCE_MMAP_SYNC 0 /* ((1 << DOMAIN_CPU) | (1 << DOMAIN_GTT)) */

#ifndef DEBUG_SYNC
#define DEBUG_SYNC 0
#endif

#define SHOW_BATCH_BEFORE 0
#define SHOW_BATCH_AFTER 0

/* Flip the "#if 0" to have these macros query the kernel via __kgem_busy();
 * by default they expand to nothing.
 */
#if 0
#define ASSERT_IDLE(kgem__, handle__) assert(!__kgem_busy(kgem__, handle__))
#define ASSERT_MAYBE_IDLE(kgem__, handle__, expect__) assert(!(expect__) || !__kgem_busy(kgem__, handle__))
#else
#define ASSERT_IDLE(kgem__, handle__)
#define ASSERT_MAYBE_IDLE(kgem__, handle__, expect__)
#endif

/* Worst case seems to be 965gm where we cannot write within a cacheline that
 * is simultaneously being read by the GPU, or within the sampler
 * prefetch. In general, the chipsets seem to have a requirement that sampler
 * offsets be aligned to a cacheline (64 bytes).
 *
 * Actually, it turns out the BLT color pattern (BR15) has the most severe
 * alignment restrictions, 64 bytes for 8-bpp, 128 bytes for 16-bpp and 256
 * bytes for 32-bpp.
 */
#define UPLOAD_ALIGNMENT 256

#define PAGE_ALIGN(x) ALIGN(x, PAGE_SIZE)
#define NUM_PAGES(x) (((x) + PAGE_SIZE-1) / PAGE_SIZE)

#define MAX_GTT_VMA_CACHE 512
#define MAX_CPU_VMA_CACHE INT16_MAX
#define MAP_PRESERVE_TIME 10

/* A user mapping is tagged by setting bit 0 of the pointer value. */
#define MAKE_USER_MAP(ptr) ((void*)((uintptr_t)(ptr) | 1))
#define IS_USER_MAP(ptr) ((uintptr_t)(ptr) & 1)

/* Local copies of I915_PARAM / I915_EXEC values, presumably so the file
 * builds against kernel headers that predate them -- TODO confirm.
 */
#define LOCAL_I915_PARAM_HAS_BLT 11
#define LOCAL_I915_PARAM_HAS_RELAXED_FENCING 12
#define LOCAL_I915_PARAM_HAS_RELAXED_DELTA 15
#define LOCAL_I915_PARAM_HAS_LLC 17
#define LOCAL_I915_PARAM_HAS_SEMAPHORES 20
#define LOCAL_I915_PARAM_HAS_SECURE_BATCHES 23
#define LOCAL_I915_PARAM_HAS_PINNED_BATCHES 24
#define LOCAL_I915_PARAM_HAS_NO_RELOC 25
#define LOCAL_I915_PARAM_HAS_HANDLE_LUT 26
#define LOCAL_I915_PARAM_HAS_WT 27
#define LOCAL_I915_PARAM_MMAP_VERSION 30
#define LOCAL_I915_PARAM_MMAP_GTT_COHERENT 52

#define LOCAL_I915_EXEC_IS_PINNED (1<<10)
#define LOCAL_I915_EXEC_NO_RELOC (1<<11)
#define LOCAL_I915_EXEC_HANDLE_LUT (1<<12)
14903b705cfSriastradh 1509a906b70Schristos#define LOCAL_I915_GEM_CREATE2 0x34 15103b705cfSriastradh#define LOCAL_IOCTL_I915_GEM_CREATE2 DRM_IOWR (DRM_COMMAND_BASE + LOCAL_I915_GEM_CREATE2, struct local_i915_gem_create2) 15203b705cfSriastradhstruct local_i915_gem_create2 { 15303b705cfSriastradh uint64_t size; 15403b705cfSriastradh uint32_t placement; 15503b705cfSriastradh#define LOCAL_I915_CREATE_PLACEMENT_SYSTEM 0 15603b705cfSriastradh#define LOCAL_I915_CREATE_PLACEMENT_STOLEN 1 /* Cannot use CPU mmaps or pread/pwrite */ 15703b705cfSriastradh uint32_t domain; 15803b705cfSriastradh uint32_t caching; 15903b705cfSriastradh uint32_t tiling_mode; 16003b705cfSriastradh uint32_t stride; 16103b705cfSriastradh uint32_t flags; 16203b705cfSriastradh uint32_t pad; 16303b705cfSriastradh uint32_t handle; 16403b705cfSriastradh}; 16503b705cfSriastradh 16603b705cfSriastradh#define LOCAL_I915_GEM_USERPTR 0x33 16703b705cfSriastradh#define LOCAL_IOCTL_I915_GEM_USERPTR DRM_IOWR (DRM_COMMAND_BASE + LOCAL_I915_GEM_USERPTR, struct local_i915_gem_userptr) 16803b705cfSriastradhstruct local_i915_gem_userptr { 16903b705cfSriastradh uint64_t user_ptr; 17003b705cfSriastradh uint64_t user_size; 17103b705cfSriastradh uint32_t flags; 1729a906b70Schristos#define I915_USERPTR_READ_ONLY 0x1 1739a906b70Schristos#define I915_USERPTR_UNSYNCHRONIZED 0x80000000 17403b705cfSriastradh uint32_t handle; 17503b705cfSriastradh}; 17603b705cfSriastradh 17703b705cfSriastradh#define UNCACHED 0 17803b705cfSriastradh#define SNOOPED 1 17903b705cfSriastradh#define DISPLAY 2 18003b705cfSriastradh 18103b705cfSriastradhstruct local_i915_gem_caching { 18203b705cfSriastradh uint32_t handle; 18303b705cfSriastradh uint32_t caching; 18403b705cfSriastradh}; 18503b705cfSriastradh 18603b705cfSriastradh#define LOCAL_I915_GEM_SET_CACHING 0x2f 1879a906b70Schristos#define LOCAL_I915_GEM_GET_CACHING 0x30 18803b705cfSriastradh#define LOCAL_IOCTL_I915_GEM_SET_CACHING DRM_IOW(DRM_COMMAND_BASE + LOCAL_I915_GEM_SET_CACHING, struct 
local_i915_gem_caching) 1899a906b70Schristos#define LOCAL_IOCTL_I915_GEM_GET_CACHING DRM_IOW(DRM_COMMAND_BASE + LOCAL_I915_GEM_GET_CACHING, struct local_i915_gem_caching) 19003b705cfSriastradh 19163ef14f0Smrgstruct local_i915_gem_mmap { 19263ef14f0Smrg uint32_t handle; 19363ef14f0Smrg uint32_t pad; 19463ef14f0Smrg uint64_t offset; 19563ef14f0Smrg uint64_t size; 19663ef14f0Smrg uint64_t addr_ptr; 19763ef14f0Smrg}; 19863ef14f0Smrg#define LOCAL_IOCTL_I915_GEM_MMAP DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_MMAP, struct local_i915_gem_mmap) 19963ef14f0Smrg 200813957e3Ssnjstruct local_i915_gem_mmap2 { 201813957e3Ssnj uint32_t handle; 202813957e3Ssnj uint32_t pad; 203813957e3Ssnj uint64_t offset; 204813957e3Ssnj uint64_t size; 205813957e3Ssnj uint64_t addr_ptr; 206813957e3Ssnj uint64_t flags; 207813957e3Ssnj#define I915_MMAP_WC 0x1 208813957e3Ssnj}; 209813957e3Ssnj#define LOCAL_IOCTL_I915_GEM_MMAP_v2 DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_MMAP, struct local_i915_gem_mmap2) 210813957e3Ssnj 21103b705cfSriastradhstruct kgem_buffer { 21203b705cfSriastradh struct kgem_bo base; 21303b705cfSriastradh void *mem; 21403b705cfSriastradh uint32_t used; 21503b705cfSriastradh uint32_t need_io : 1; 21603b705cfSriastradh uint32_t write : 2; 2179a906b70Schristos uint32_t mmapped : 2; 2189a906b70Schristos}; 2199a906b70Schristosenum { 2209a906b70Schristos MMAPPED_NONE, 2219a906b70Schristos MMAPPED_GTT, 2229a906b70Schristos MMAPPED_CPU 22303b705cfSriastradh}; 22403b705cfSriastradh 22503b705cfSriastradhstatic struct kgem_bo *__kgem_freed_bo; 22603b705cfSriastradhstatic struct kgem_request *__kgem_freed_request; 22703b705cfSriastradhstatic struct drm_i915_gem_exec_object2 _kgem_dummy_exec; 22803b705cfSriastradh 22963ef14f0Smrgstatic inline struct sna *__to_sna(struct kgem *kgem) 23063ef14f0Smrg{ 23163ef14f0Smrg /* minor layering violations */ 23263ef14f0Smrg return container_of(kgem, struct sna, kgem); 23363ef14f0Smrg} 23463ef14f0Smrg 23503b705cfSriastradhstatic inline int bytes(struct 
kgem_bo *bo) 23603b705cfSriastradh{ 23703b705cfSriastradh return __kgem_bo_size(bo); 23803b705cfSriastradh} 23903b705cfSriastradh 24003b705cfSriastradh#define bucket(B) (B)->size.pages.bucket 24103b705cfSriastradh#define num_pages(B) (B)->size.pages.count 24203b705cfSriastradh 24363ef14f0Smrgstatic int __do_ioctl(int fd, unsigned long req, void *arg) 2449a906b70Schristos{ 24563ef14f0Smrg do { 24663ef14f0Smrg int err; 2479a906b70Schristos 24863ef14f0Smrg switch ((err = errno)) { 24963ef14f0Smrg case EAGAIN: 25063ef14f0Smrg sched_yield(); 25163ef14f0Smrg case EINTR: 25263ef14f0Smrg break; 25363ef14f0Smrg default: 25463ef14f0Smrg return -err; 25563ef14f0Smrg } 2569a906b70Schristos 25763ef14f0Smrg if (likely(ioctl(fd, req, arg) == 0)) 25863ef14f0Smrg return 0; 25963ef14f0Smrg } while (1); 26063ef14f0Smrg} 2619a906b70Schristos 26263ef14f0Smrginline static int do_ioctl(int fd, unsigned long req, void *arg) 26363ef14f0Smrg{ 26463ef14f0Smrg if (likely(ioctl(fd, req, arg) == 0)) 26563ef14f0Smrg return 0; 2669a906b70Schristos 26763ef14f0Smrg return __do_ioctl(fd, req, arg); 2689a906b70Schristos} 2699a906b70Schristos 27003b705cfSriastradh#ifdef DEBUG_MEMORY 27103b705cfSriastradhstatic void debug_alloc(struct kgem *kgem, size_t size) 27203b705cfSriastradh{ 27303b705cfSriastradh kgem->debug_memory.bo_allocs++; 27403b705cfSriastradh kgem->debug_memory.bo_bytes += size; 27503b705cfSriastradh} 27603b705cfSriastradhstatic void debug_alloc__bo(struct kgem *kgem, struct kgem_bo *bo) 27703b705cfSriastradh{ 27803b705cfSriastradh debug_alloc(kgem, bytes(bo)); 27903b705cfSriastradh} 28003b705cfSriastradh#else 28103b705cfSriastradh#define debug_alloc__bo(k, b) 28203b705cfSriastradh#endif 28303b705cfSriastradh 28403b705cfSriastradh#ifndef NDEBUG 28503b705cfSriastradhstatic void assert_tiling(struct kgem *kgem, struct kgem_bo *bo) 28603b705cfSriastradh{ 28703b705cfSriastradh struct drm_i915_gem_get_tiling tiling; 28803b705cfSriastradh 28903b705cfSriastradh assert(bo); 29003b705cfSriastradh 
29163ef14f0Smrg if (!kgem->can_fence && kgem->gen >= 040 && bo->tiling) 29263ef14f0Smrg return; /* lies */ 29363ef14f0Smrg 29403b705cfSriastradh VG_CLEAR(tiling); 29503b705cfSriastradh tiling.handle = bo->handle; 2969a906b70Schristos tiling.tiling_mode = bo->tiling; 2979a906b70Schristos (void)do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_GET_TILING, &tiling); 29803b705cfSriastradh assert(tiling.tiling_mode == bo->tiling); 29903b705cfSriastradh} 3009a906b70Schristos 30163ef14f0Smrgstatic void assert_caching(struct kgem *kgem, struct kgem_bo *bo) 3029a906b70Schristos{ 3039a906b70Schristos struct local_i915_gem_caching arg; 3049a906b70Schristos int expect = kgem->has_llc ? SNOOPED : UNCACHED; 3059a906b70Schristos 3069a906b70Schristos VG_CLEAR(arg); 3079a906b70Schristos arg.handle = bo->handle; 3089a906b70Schristos arg.caching = expect; 3099a906b70Schristos 3109a906b70Schristos (void)do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_GET_CACHING, &arg); 3119a906b70Schristos 3129a906b70Schristos assert(arg.caching == expect); 3139a906b70Schristos} 3149a906b70Schristos 3159a906b70Schristosstatic void assert_bo_retired(struct kgem_bo *bo) 3169a906b70Schristos{ 3179a906b70Schristos DBG(("%s: handle=%d, domain: %d exec? %d, rq? 
%d\n", __FUNCTION__, 3189a906b70Schristos bo->handle, bo->domain, bo->exec != NULL, bo->rq != NULL)); 3199a906b70Schristos assert(bo->refcnt); 3209a906b70Schristos assert(bo->rq == NULL); 3219a906b70Schristos assert(bo->exec == NULL); 32263ef14f0Smrg assert(!bo->needs_flush); 3239a906b70Schristos assert(list_is_empty(&bo->request)); 3249a906b70Schristos} 32503b705cfSriastradh#else 32603b705cfSriastradh#define assert_tiling(kgem, bo) 32763ef14f0Smrg#define assert_caching(kgem, bo) 3289a906b70Schristos#define assert_bo_retired(bo) 32903b705cfSriastradh#endif 33003b705cfSriastradh 33163ef14f0Smrgstatic int __find_debugfs(struct kgem *kgem) 33263ef14f0Smrg{ 33363ef14f0Smrg int i; 33463ef14f0Smrg 33563ef14f0Smrg for (i = 0; i < DRM_MAX_MINOR; i++) { 33663ef14f0Smrg char path[80]; 33763ef14f0Smrg 33863ef14f0Smrg sprintf(path, "/sys/kernel/debug/dri/%d/i915_wedged", i); 33963ef14f0Smrg if (access(path, R_OK) == 0) 34063ef14f0Smrg return i; 34163ef14f0Smrg 34263ef14f0Smrg sprintf(path, "/debug/dri/%d/i915_wedged", i); 34363ef14f0Smrg if (access(path, R_OK) == 0) 34463ef14f0Smrg return i; 34563ef14f0Smrg } 34663ef14f0Smrg 34763ef14f0Smrg return -1; 34863ef14f0Smrg} 34963ef14f0Smrg 35063ef14f0Smrgstatic int kgem_get_minor(struct kgem *kgem) 35163ef14f0Smrg{ 35263ef14f0Smrg struct stat st; 35363ef14f0Smrg 35463ef14f0Smrg if (fstat(kgem->fd, &st)) 35563ef14f0Smrg return __find_debugfs(kgem); 35663ef14f0Smrg 35763ef14f0Smrg if (!S_ISCHR(st.st_mode)) 35863ef14f0Smrg return __find_debugfs(kgem); 35963ef14f0Smrg 36063ef14f0Smrg return st.st_rdev & 0x63; 36163ef14f0Smrg} 36263ef14f0Smrg 36363ef14f0Smrgstatic bool find_hang_state(struct kgem *kgem, char *path, int maxlen) 36463ef14f0Smrg{ 36563ef14f0Smrg int minor = kgem_get_minor(kgem); 36663ef14f0Smrg 36763ef14f0Smrg /* Search for our hang state in a few canonical locations. 36863ef14f0Smrg * In the unlikely event of having multiple devices, we 36963ef14f0Smrg * will need to check which minor actually corresponds to ours. 
37063ef14f0Smrg */ 37163ef14f0Smrg 37263ef14f0Smrg snprintf(path, maxlen, "/sys/class/drm/card%d/error", minor); 37363ef14f0Smrg if (access(path, R_OK) == 0) 37463ef14f0Smrg return true; 37563ef14f0Smrg 37663ef14f0Smrg snprintf(path, maxlen, "/sys/kernel/debug/dri/%d/i915_error_state", minor); 37763ef14f0Smrg if (access(path, R_OK) == 0) 37863ef14f0Smrg return true; 37963ef14f0Smrg 38063ef14f0Smrg snprintf(path, maxlen, "/debug/dri/%d/i915_error_state", minor); 38163ef14f0Smrg if (access(path, R_OK) == 0) 38263ef14f0Smrg return true; 38363ef14f0Smrg 38463ef14f0Smrg path[0] = '\0'; 38563ef14f0Smrg return false; 38663ef14f0Smrg} 38763ef14f0Smrg 38863ef14f0Smrgstatic bool has_error_state(struct kgem *kgem, char *path) 38963ef14f0Smrg{ 39063ef14f0Smrg bool ret = false; 39163ef14f0Smrg char no; 39263ef14f0Smrg int fd; 39363ef14f0Smrg 39463ef14f0Smrg fd = open(path, O_RDONLY); 39563ef14f0Smrg if (fd >= 0) { 39663ef14f0Smrg ret = read(fd, &no, 1) == 1 && no != 'N'; 39763ef14f0Smrg close(fd); 39863ef14f0Smrg } 39963ef14f0Smrg 40063ef14f0Smrg return ret; 40163ef14f0Smrg} 40263ef14f0Smrg 40363ef14f0Smrgstatic int kgem_get_screen_index(struct kgem *kgem) 40463ef14f0Smrg{ 40563ef14f0Smrg return __to_sna(kgem)->scrn->scrnIndex; 40663ef14f0Smrg} 40763ef14f0Smrg 408813957e3Ssnjstatic void 409813957e3Ssnj__kgem_set_wedged(struct kgem *kgem) 410813957e3Ssnj{ 41163ef14f0Smrg static int once; 41263ef14f0Smrg char path[256]; 41363ef14f0Smrg 41463ef14f0Smrg if (kgem->wedged) 41563ef14f0Smrg return; 41663ef14f0Smrg 41763ef14f0Smrg if (!once && 41863ef14f0Smrg find_hang_state(kgem, path, sizeof(path)) && 41963ef14f0Smrg has_error_state(kgem, path)) { 42063ef14f0Smrg xf86DrvMsg(kgem_get_screen_index(kgem), X_ERROR, 42163ef14f0Smrg "When reporting this, please include %s and the full dmesg.\n", 42263ef14f0Smrg path); 42363ef14f0Smrg once = 1; 42463ef14f0Smrg } 42563ef14f0Smrg 426813957e3Ssnj kgem->wedged = true; 42763ef14f0Smrg sna_render_mark_wedged(__to_sna(kgem)); 428813957e3Ssnj} 
429813957e3Ssnj 43003b705cfSriastradhstatic void kgem_sna_reset(struct kgem *kgem) 43103b705cfSriastradh{ 43263ef14f0Smrg struct sna *sna = __to_sna(kgem); 43303b705cfSriastradh 43403b705cfSriastradh sna->render.reset(sna); 43503b705cfSriastradh sna->blt_state.fill_bo = 0; 43603b705cfSriastradh} 43703b705cfSriastradh 43803b705cfSriastradhstatic void kgem_sna_flush(struct kgem *kgem) 43903b705cfSriastradh{ 44063ef14f0Smrg struct sna *sna = __to_sna(kgem); 44103b705cfSriastradh 44203b705cfSriastradh sna->render.flush(sna); 44303b705cfSriastradh 44403b705cfSriastradh if (sna->render.solid_cache.dirty) 44503b705cfSriastradh sna_render_flush_solid(sna); 44603b705cfSriastradh} 44703b705cfSriastradh 44863ef14f0Smrgstatic bool kgem_bo_rmfb(struct kgem *kgem, struct kgem_bo *bo) 44963ef14f0Smrg{ 45063ef14f0Smrg if (bo->scanout && bo->delta) { 45163ef14f0Smrg DBG(("%s: releasing fb=%d for handle=%d\n", 45263ef14f0Smrg __FUNCTION__, bo->delta, bo->handle)); 45363ef14f0Smrg /* XXX will leak if we are not DRM_MASTER. 
*shrug* */ 45463ef14f0Smrg do_ioctl(kgem->fd, DRM_IOCTL_MODE_RMFB, &bo->delta); 45563ef14f0Smrg bo->delta = 0; 45663ef14f0Smrg return true; 45763ef14f0Smrg } else 45863ef14f0Smrg return false; 45963ef14f0Smrg} 46063ef14f0Smrg 46163ef14f0Smrgstatic bool kgem_set_tiling(struct kgem *kgem, struct kgem_bo *bo, 46263ef14f0Smrg int tiling, int stride) 46303b705cfSriastradh{ 46403b705cfSriastradh struct drm_i915_gem_set_tiling set_tiling; 4659a906b70Schristos int err; 46603b705cfSriastradh 46763ef14f0Smrg if (tiling == bo->tiling) { 46863ef14f0Smrg if (tiling == I915_TILING_NONE) { 46963ef14f0Smrg bo->pitch = stride; 47063ef14f0Smrg return true; 47163ef14f0Smrg } 47263ef14f0Smrg if (stride == bo->pitch) 47363ef14f0Smrg return true; 47463ef14f0Smrg } 47563ef14f0Smrg 47603b705cfSriastradh if (DBG_NO_TILING) 47703b705cfSriastradh return false; 47803b705cfSriastradh 47903b705cfSriastradh VG_CLEAR(set_tiling); 4809a906b70Schristosrestart: 48163ef14f0Smrg set_tiling.handle = bo->handle; 4829a906b70Schristos set_tiling.tiling_mode = tiling; 48363ef14f0Smrg set_tiling.stride = tiling ? stride : 0; 48403b705cfSriastradh 48563ef14f0Smrg if (ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_TILING, &set_tiling) == 0) { 48663ef14f0Smrg bo->tiling = set_tiling.tiling_mode; 48763ef14f0Smrg bo->pitch = set_tiling.tiling_mode ? 
set_tiling.stride : stride; 48863ef14f0Smrg DBG(("%s: handle=%d, tiling=%d [%d], pitch=%d [%d]: %d\n", 48963ef14f0Smrg __FUNCTION__, bo->handle, 49063ef14f0Smrg bo->tiling, tiling, 49163ef14f0Smrg bo->pitch, stride, 49263ef14f0Smrg set_tiling.tiling_mode == tiling)); 49363ef14f0Smrg return set_tiling.tiling_mode == tiling && bo->pitch >= stride; 49463ef14f0Smrg } 4959a906b70Schristos 4969a906b70Schristos err = errno; 4979a906b70Schristos if (err == EINTR) 4989a906b70Schristos goto restart; 4999a906b70Schristos 5009a906b70Schristos if (err == EAGAIN) { 5019a906b70Schristos sched_yield(); 5029a906b70Schristos goto restart; 5039a906b70Schristos } 5049a906b70Schristos 50563ef14f0Smrg if (err == EBUSY && kgem_bo_rmfb(kgem, bo)) 50663ef14f0Smrg goto restart; 50763ef14f0Smrg 50863ef14f0Smrg ERR(("%s: failed to set-tiling(tiling=%d, pitch=%d) for handle=%d: %d\n", 50963ef14f0Smrg __FUNCTION__, tiling, stride, bo->handle, err)); 5109a906b70Schristos return false; 51103b705cfSriastradh} 51203b705cfSriastradh 51303b705cfSriastradhstatic bool gem_set_caching(int fd, uint32_t handle, int caching) 51403b705cfSriastradh{ 51503b705cfSriastradh struct local_i915_gem_caching arg; 51603b705cfSriastradh 51703b705cfSriastradh VG_CLEAR(arg); 51803b705cfSriastradh arg.handle = handle; 51903b705cfSriastradh arg.caching = caching; 5209a906b70Schristos return do_ioctl(fd, LOCAL_IOCTL_I915_GEM_SET_CACHING, &arg) == 0; 52103b705cfSriastradh} 52203b705cfSriastradh 52303b705cfSriastradhstatic uint32_t gem_userptr(int fd, void *ptr, int size, int read_only) 52403b705cfSriastradh{ 52503b705cfSriastradh struct local_i915_gem_userptr arg; 52603b705cfSriastradh 52703b705cfSriastradh VG_CLEAR(arg); 52803b705cfSriastradh arg.user_ptr = (uintptr_t)ptr; 52903b705cfSriastradh arg.user_size = size; 53003b705cfSriastradh arg.flags = I915_USERPTR_UNSYNCHRONIZED; 53103b705cfSriastradh if (read_only) 53203b705cfSriastradh arg.flags |= I915_USERPTR_READ_ONLY; 53303b705cfSriastradh 53403b705cfSriastradh if 
(DBG_NO_UNSYNCHRONIZED_USERPTR || 5359a906b70Schristos do_ioctl(fd, LOCAL_IOCTL_I915_GEM_USERPTR, &arg)) { 53603b705cfSriastradh arg.flags &= ~I915_USERPTR_UNSYNCHRONIZED; 5379a906b70Schristos if (do_ioctl(fd, LOCAL_IOCTL_I915_GEM_USERPTR, &arg)) { 53803b705cfSriastradh DBG(("%s: failed to map %p + %d bytes: %d\n", 53903b705cfSriastradh __FUNCTION__, ptr, size, errno)); 54003b705cfSriastradh return 0; 54103b705cfSriastradh } 54203b705cfSriastradh } 54303b705cfSriastradh 54403b705cfSriastradh return arg.handle; 54503b705cfSriastradh} 54603b705cfSriastradh 5479a906b70Schristosstatic bool __kgem_throttle(struct kgem *kgem, bool harder) 54803b705cfSriastradh{ 5499a906b70Schristos /* Let this be woken up by sigtimer so that we don't block here 5509a906b70Schristos * too much and completely starve X. We will sleep again shortly, 5519a906b70Schristos * and so catch up or detect the hang. 5529a906b70Schristos */ 5539a906b70Schristos do { 5549a906b70Schristos if (ioctl(kgem->fd, DRM_IOCTL_I915_GEM_THROTTLE) == 0) { 5559a906b70Schristos kgem->need_throttle = 0; 5569a906b70Schristos return false; 5579a906b70Schristos } 55803b705cfSriastradh 5599a906b70Schristos if (errno == EIO) 5609a906b70Schristos return true; 5619a906b70Schristos } while (harder); 5629a906b70Schristos 5639a906b70Schristos return false; 5649a906b70Schristos} 5659a906b70Schristos 5669a906b70Schristosstatic bool __kgem_throttle_retire(struct kgem *kgem, unsigned flags) 5679a906b70Schristos{ 5689a906b70Schristos if (flags & CREATE_NO_RETIRE || !kgem->need_retire) { 5699a906b70Schristos DBG(("%s: not retiring\n", __FUNCTION__)); 57003b705cfSriastradh return false; 57103b705cfSriastradh } 57203b705cfSriastradh 57303b705cfSriastradh if (kgem_retire(kgem)) 57403b705cfSriastradh return true; 57503b705cfSriastradh 57603b705cfSriastradh if (flags & CREATE_NO_THROTTLE || !kgem->need_throttle) { 57703b705cfSriastradh DBG(("%s: not throttling\n", __FUNCTION__)); 57803b705cfSriastradh return false; 57903b705cfSriastradh 
} 58003b705cfSriastradh 5819a906b70Schristos __kgem_throttle(kgem, false); 58203b705cfSriastradh return kgem_retire(kgem); 58303b705cfSriastradh} 58403b705cfSriastradh 58503b705cfSriastradhstatic void *__kgem_bo_map__gtt(struct kgem *kgem, struct kgem_bo *bo) 58603b705cfSriastradh{ 587813957e3Ssnj struct drm_i915_gem_mmap_gtt gtt; 58803b705cfSriastradh void *ptr; 5893d02bce8Sriastradh int err; 59003b705cfSriastradh 59103b705cfSriastradh DBG(("%s(handle=%d, size=%d)\n", __FUNCTION__, 59203b705cfSriastradh bo->handle, bytes(bo))); 59303b705cfSriastradh 59463ef14f0Smrg if (bo->tiling && !kgem->can_fence) 59563ef14f0Smrg return NULL; 59663ef14f0Smrg 597813957e3Ssnj VG_CLEAR(gtt); 59803b705cfSriastradhretry_gtt: 599813957e3Ssnj gtt.handle = bo->handle; 600813957e3Ssnj if ((err = do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_MMAP_GTT, >t))) { 60163ef14f0Smrg DBG(("%s: failed %d, throttling/cleaning caches\n", 60263ef14f0Smrg __FUNCTION__, err)); 60303b705cfSriastradh assert(err != EINVAL); 60403b705cfSriastradh 60503b705cfSriastradh (void)__kgem_throttle_retire(kgem, 0); 60603b705cfSriastradh if (kgem_expire_cache(kgem)) 60703b705cfSriastradh goto retry_gtt; 60803b705cfSriastradh 6099a906b70Schristos if (kgem_cleanup_cache(kgem)) 61003b705cfSriastradh goto retry_gtt; 61103b705cfSriastradh 6129a906b70Schristos ERR(("%s: failed to retrieve GTT offset for handle=%d: %d\n", 6139a906b70Schristos __FUNCTION__, bo->handle, -err)); 61403b705cfSriastradh return NULL; 61503b705cfSriastradh } 61603b705cfSriastradh 61703b705cfSriastradhretry_mmap: 6189a906b70Schristos ptr = mmap(0, bytes(bo), PROT_READ | PROT_WRITE, MAP_SHARED, 619813957e3Ssnj kgem->fd, gtt.offset); 6209a906b70Schristos if (ptr == MAP_FAILED) { 6219a906b70Schristos err = errno; 62263ef14f0Smrg DBG(("%s: failed %d, throttling/cleaning caches\n", 62363ef14f0Smrg __FUNCTION__, err)); 62403b705cfSriastradh assert(err != EINVAL); 62503b705cfSriastradh 62603b705cfSriastradh if (__kgem_throttle_retire(kgem, 0)) 
62703b705cfSriastradh goto retry_mmap; 62803b705cfSriastradh 6299a906b70Schristos if (kgem_cleanup_cache(kgem)) 63003b705cfSriastradh goto retry_mmap; 63103b705cfSriastradh 6329a906b70Schristos ERR(("%s: failed to mmap handle=%d, %d bytes, into GTT domain: %d\n", 6339a906b70Schristos __FUNCTION__, bo->handle, bytes(bo), err)); 63403b705cfSriastradh ptr = NULL; 63503b705cfSriastradh } 63603b705cfSriastradh 637813957e3Ssnj /* Cache this mapping to avoid the overhead of an 638813957e3Ssnj * excruciatingly slow GTT pagefault. This is more an 639813957e3Ssnj * issue with compositing managers which need to 640813957e3Ssnj * frequently flush CPU damage to their GPU bo. 641813957e3Ssnj */ 642813957e3Ssnj return bo->map__gtt = ptr; 643813957e3Ssnj} 644813957e3Ssnj 645813957e3Ssnjstatic void *__kgem_bo_map__wc(struct kgem *kgem, struct kgem_bo *bo) 646813957e3Ssnj{ 647813957e3Ssnj struct local_i915_gem_mmap2 wc; 648813957e3Ssnj int err; 649813957e3Ssnj 650813957e3Ssnj DBG(("%s(handle=%d, size=%d)\n", __FUNCTION__, 651813957e3Ssnj bo->handle, bytes(bo))); 652813957e3Ssnj assert(kgem->has_wc_mmap); 653813957e3Ssnj 654813957e3Ssnj VG_CLEAR(wc); 655813957e3Ssnj 656813957e3Ssnjretry_wc: 657813957e3Ssnj wc.handle = bo->handle; 658813957e3Ssnj wc.offset = 0; 659813957e3Ssnj wc.size = bytes(bo); 660813957e3Ssnj wc.flags = I915_MMAP_WC; 661813957e3Ssnj if ((err = do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_MMAP_v2, &wc))) { 66263ef14f0Smrg DBG(("%s: failed %d, throttling/cleaning caches\n", 66363ef14f0Smrg __FUNCTION__, err)); 664813957e3Ssnj assert(err != EINVAL); 665813957e3Ssnj 666813957e3Ssnj if (__kgem_throttle_retire(kgem, 0)) 667813957e3Ssnj goto retry_wc; 668813957e3Ssnj 669813957e3Ssnj if (kgem_cleanup_cache(kgem)) 670813957e3Ssnj goto retry_wc; 671813957e3Ssnj 672813957e3Ssnj ERR(("%s: failed to mmap handle=%d, %d bytes, into CPU(wc) domain: %d\n", 673813957e3Ssnj __FUNCTION__, bo->handle, bytes(bo), -err)); 674813957e3Ssnj return NULL; 675813957e3Ssnj } 676813957e3Ssnj 
677813957e3Ssnj VG(VALGRIND_MAKE_MEM_DEFINED(wc.addr_ptr, bytes(bo))); 678813957e3Ssnj 679813957e3Ssnj DBG(("%s: caching CPU(wc) vma for %d\n", __FUNCTION__, bo->handle)); 680813957e3Ssnj return bo->map__wc = (void *)(uintptr_t)wc.addr_ptr; 681813957e3Ssnj} 682813957e3Ssnj 683813957e3Ssnjstatic void *__kgem_bo_map__cpu(struct kgem *kgem, struct kgem_bo *bo) 684813957e3Ssnj{ 68563ef14f0Smrg struct local_i915_gem_mmap arg; 686813957e3Ssnj int err; 687813957e3Ssnj 68863ef14f0Smrg VG_CLEAR(arg); 68963ef14f0Smrg arg.offset = 0; 69063ef14f0Smrg 691813957e3Ssnjretry: 69263ef14f0Smrg arg.handle = bo->handle; 69363ef14f0Smrg arg.size = bytes(bo); 69463ef14f0Smrg if ((err = do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_MMAP, &arg))) { 69563ef14f0Smrg DBG(("%s: failed %d, throttling/cleaning caches\n", 69663ef14f0Smrg __FUNCTION__, err)); 69763ef14f0Smrg assert(err != -EINVAL || bo->prime); 698813957e3Ssnj 699813957e3Ssnj if (__kgem_throttle_retire(kgem, 0)) 700813957e3Ssnj goto retry; 701813957e3Ssnj 702813957e3Ssnj if (kgem_cleanup_cache(kgem)) 703813957e3Ssnj goto retry; 704813957e3Ssnj 70563ef14f0Smrg ERR(("%s: failed to mmap handle=%d (prime? 
%d), %d bytes, into CPU domain: %d\n", 70663ef14f0Smrg __FUNCTION__, bo->handle, bo->prime, bytes(bo), -err)); 70763ef14f0Smrg bo->purged = 1; 708813957e3Ssnj return NULL; 709813957e3Ssnj } 710813957e3Ssnj 71163ef14f0Smrg VG(VALGRIND_MAKE_MEM_DEFINED(arg.addr_ptr, bytes(bo))); 712813957e3Ssnj 713813957e3Ssnj DBG(("%s: caching CPU vma for %d\n", __FUNCTION__, bo->handle)); 71463ef14f0Smrg return bo->map__cpu = (void *)(uintptr_t)arg.addr_ptr; 71503b705cfSriastradh} 71603b705cfSriastradh 7179a906b70Schristosstatic int gem_write(int fd, uint32_t handle, 7189a906b70Schristos int offset, int length, 7199a906b70Schristos const void *src) 72003b705cfSriastradh{ 72103b705cfSriastradh struct drm_i915_gem_pwrite pwrite; 72203b705cfSriastradh 72303b705cfSriastradh DBG(("%s(handle=%d, offset=%d, len=%d)\n", __FUNCTION__, 72403b705cfSriastradh handle, offset, length)); 72503b705cfSriastradh 72603b705cfSriastradh VG_CLEAR(pwrite); 72703b705cfSriastradh pwrite.handle = handle; 72803b705cfSriastradh pwrite.offset = offset; 72903b705cfSriastradh pwrite.size = length; 73003b705cfSriastradh pwrite.data_ptr = (uintptr_t)src; 7319a906b70Schristos return do_ioctl(fd, DRM_IOCTL_I915_GEM_PWRITE, &pwrite); 73203b705cfSriastradh} 73303b705cfSriastradh 7349a906b70Schristosstatic int gem_write__cachealigned(int fd, uint32_t handle, 7359a906b70Schristos int offset, int length, 7369a906b70Schristos const void *src) 73703b705cfSriastradh{ 73803b705cfSriastradh struct drm_i915_gem_pwrite pwrite; 73903b705cfSriastradh 74003b705cfSriastradh DBG(("%s(handle=%d, offset=%d, len=%d)\n", __FUNCTION__, 74103b705cfSriastradh handle, offset, length)); 74203b705cfSriastradh 74303b705cfSriastradh VG_CLEAR(pwrite); 74403b705cfSriastradh pwrite.handle = handle; 74503b705cfSriastradh /* align the transfer to cachelines; fortuitously this is safe! 
*/ 74603b705cfSriastradh if ((offset | length) & 63) { 74703b705cfSriastradh pwrite.offset = offset & ~63; 74803b705cfSriastradh pwrite.size = ALIGN(offset+length, 64) - pwrite.offset; 74903b705cfSriastradh pwrite.data_ptr = (uintptr_t)src + pwrite.offset - offset; 75003b705cfSriastradh } else { 75103b705cfSriastradh pwrite.offset = offset; 75203b705cfSriastradh pwrite.size = length; 75303b705cfSriastradh pwrite.data_ptr = (uintptr_t)src; 75403b705cfSriastradh } 7559a906b70Schristos return do_ioctl(fd, DRM_IOCTL_I915_GEM_PWRITE, &pwrite); 75603b705cfSriastradh} 75703b705cfSriastradh 75803b705cfSriastradhstatic int gem_read(int fd, uint32_t handle, const void *dst, 75903b705cfSriastradh int offset, int length) 76003b705cfSriastradh{ 76103b705cfSriastradh struct drm_i915_gem_pread pread; 76203b705cfSriastradh int ret; 76303b705cfSriastradh 76403b705cfSriastradh DBG(("%s(handle=%d, len=%d)\n", __FUNCTION__, 76503b705cfSriastradh handle, length)); 76603b705cfSriastradh 76703b705cfSriastradh VG_CLEAR(pread); 76803b705cfSriastradh pread.handle = handle; 76903b705cfSriastradh pread.offset = offset; 77003b705cfSriastradh pread.size = length; 77103b705cfSriastradh pread.data_ptr = (uintptr_t)dst; 7729a906b70Schristos ret = do_ioctl(fd, DRM_IOCTL_I915_GEM_PREAD, &pread); 77303b705cfSriastradh if (ret) { 7749a906b70Schristos DBG(("%s: failed, errno=%d\n", __FUNCTION__, -ret)); 77503b705cfSriastradh return ret; 77603b705cfSriastradh } 77703b705cfSriastradh 77803b705cfSriastradh VG(VALGRIND_MAKE_MEM_DEFINED(dst, length)); 77903b705cfSriastradh return 0; 78003b705cfSriastradh} 78103b705cfSriastradh 78203b705cfSriastradhbool __kgem_busy(struct kgem *kgem, int handle) 78303b705cfSriastradh{ 78403b705cfSriastradh struct drm_i915_gem_busy busy; 78503b705cfSriastradh 78603b705cfSriastradh VG_CLEAR(busy); 78703b705cfSriastradh busy.handle = handle; 78803b705cfSriastradh busy.busy = !kgem->wedged; 7899a906b70Schristos (void)do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_BUSY, &busy); 
79003b705cfSriastradh DBG(("%s: handle=%d, busy=%d, wedged=%d\n", 79103b705cfSriastradh __FUNCTION__, handle, busy.busy, kgem->wedged)); 79203b705cfSriastradh 79303b705cfSriastradh return busy.busy; 79403b705cfSriastradh} 79503b705cfSriastradh 79603b705cfSriastradhstatic void kgem_bo_retire(struct kgem *kgem, struct kgem_bo *bo) 79703b705cfSriastradh{ 79803b705cfSriastradh DBG(("%s: retiring bo handle=%d (needed flush? %d), rq? %d [busy?=%d]\n", 79903b705cfSriastradh __FUNCTION__, bo->handle, bo->needs_flush, bo->rq != NULL, 80003b705cfSriastradh __kgem_busy(kgem, bo->handle))); 80103b705cfSriastradh assert(bo->exec == NULL); 80203b705cfSriastradh assert(list_is_empty(&bo->vma)); 80303b705cfSriastradh 80463ef14f0Smrg if (bo->rq) 80563ef14f0Smrg __kgem_retire_requests_upto(kgem, bo); 80663ef14f0Smrg ASSERT_IDLE(kgem, bo->handle); 80763ef14f0Smrg assert_bo_retired(bo); 8089a906b70Schristos} 8099a906b70Schristos 8109a906b70Schristosstatic void kgem_bo_maybe_retire(struct kgem *kgem, struct kgem_bo *bo) 8119a906b70Schristos{ 8129a906b70Schristos DBG(("%s: retiring bo handle=%d (needed flush? %d), rq? 
%d [busy?=%d]\n", 8139a906b70Schristos __FUNCTION__, bo->handle, bo->needs_flush, bo->rq != NULL, 8149a906b70Schristos __kgem_busy(kgem, bo->handle))); 8159a906b70Schristos assert(bo->exec == NULL); 8169a906b70Schristos assert(list_is_empty(&bo->vma)); 8179a906b70Schristos 81803b705cfSriastradh if (bo->rq) { 81963ef14f0Smrg if (!__kgem_busy(kgem, bo->handle)) 82063ef14f0Smrg __kgem_retire_requests_upto(kgem, bo); 82103b705cfSriastradh } else { 82203b705cfSriastradh assert(!bo->needs_flush); 82303b705cfSriastradh ASSERT_IDLE(kgem, bo->handle); 82403b705cfSriastradh } 82503b705cfSriastradh} 82603b705cfSriastradh 82703b705cfSriastradhbool kgem_bo_write(struct kgem *kgem, struct kgem_bo *bo, 82803b705cfSriastradh const void *data, int length) 82903b705cfSriastradh{ 830813957e3Ssnj void *ptr; 8319a906b70Schristos int err; 8329a906b70Schristos 83303b705cfSriastradh assert(bo->refcnt); 83403b705cfSriastradh assert(bo->proxy == NULL); 83503b705cfSriastradh ASSERT_IDLE(kgem, bo->handle); 83603b705cfSriastradh 83703b705cfSriastradh assert(length <= bytes(bo)); 8389a906b70Schristosretry: 839813957e3Ssnj ptr = NULL; 840813957e3Ssnj if (bo->domain == DOMAIN_CPU || (kgem->has_llc && !bo->scanout)) { 841813957e3Ssnj ptr = bo->map__cpu; 842813957e3Ssnj if (ptr == NULL) 843813957e3Ssnj ptr = __kgem_bo_map__cpu(kgem, bo); 844813957e3Ssnj } else if (kgem->has_wc_mmap) { 845813957e3Ssnj ptr = bo->map__wc; 846813957e3Ssnj if (ptr == NULL) 847813957e3Ssnj ptr = __kgem_bo_map__wc(kgem, bo); 848813957e3Ssnj } 849813957e3Ssnj if (ptr) { 850813957e3Ssnj /* XXX unsynchronized? 
*/ 851813957e3Ssnj memcpy(ptr, data, length); 852813957e3Ssnj return true; 853813957e3Ssnj } 854813957e3Ssnj 8559a906b70Schristos if ((err = gem_write(kgem->fd, bo->handle, 0, length, data))) { 85663ef14f0Smrg DBG(("%s: failed %d, throttling/cleaning caches\n", 85763ef14f0Smrg __FUNCTION__, err)); 8589a906b70Schristos assert(err != EINVAL); 8599a906b70Schristos 8609a906b70Schristos (void)__kgem_throttle_retire(kgem, 0); 8619a906b70Schristos if (kgem_expire_cache(kgem)) 8629a906b70Schristos goto retry; 8639a906b70Schristos 8649a906b70Schristos if (kgem_cleanup_cache(kgem)) 8659a906b70Schristos goto retry; 8669a906b70Schristos 8679a906b70Schristos ERR(("%s: failed to write %d bytes into BO handle=%d: %d\n", 8689a906b70Schristos __FUNCTION__, length, bo->handle, -err)); 86903b705cfSriastradh return false; 8709a906b70Schristos } 87103b705cfSriastradh 87203b705cfSriastradh DBG(("%s: flush=%d, domain=%d\n", __FUNCTION__, bo->flush, bo->domain)); 8739a906b70Schristos if (bo->exec == NULL) 8749a906b70Schristos kgem_bo_maybe_retire(kgem, bo); 8759a906b70Schristos bo->domain = DOMAIN_NONE; 87603b705cfSriastradh bo->gtt_dirty = true; 87703b705cfSriastradh return true; 87803b705cfSriastradh} 87903b705cfSriastradh 88003b705cfSriastradhstatic uint32_t gem_create(int fd, int num_pages) 88103b705cfSriastradh{ 88203b705cfSriastradh struct drm_i915_gem_create create; 88303b705cfSriastradh 88403b705cfSriastradh VG_CLEAR(create); 88503b705cfSriastradh create.handle = 0; 88603b705cfSriastradh create.size = PAGE_SIZE * num_pages; 8879a906b70Schristos (void)do_ioctl(fd, DRM_IOCTL_I915_GEM_CREATE, &create); 88803b705cfSriastradh 88903b705cfSriastradh return create.handle; 89003b705cfSriastradh} 89103b705cfSriastradh 89263ef14f0Smrgstatic void 89303b705cfSriastradhkgem_bo_set_purgeable(struct kgem *kgem, struct kgem_bo *bo) 89403b705cfSriastradh{ 89563ef14f0Smrg#if !DBG_NO_MADV 89603b705cfSriastradh struct drm_i915_gem_madvise madv; 89703b705cfSriastradh 89803b705cfSriastradh 
assert(bo->exec == NULL); 89903b705cfSriastradh 90003b705cfSriastradh VG_CLEAR(madv); 90103b705cfSriastradh madv.handle = bo->handle; 90203b705cfSriastradh madv.madv = I915_MADV_DONTNEED; 9039a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_MADVISE, &madv) == 0) { 90463ef14f0Smrg bo->purged = true; 90563ef14f0Smrg kgem->need_purge |= !madv.retained && bo->domain != DOMAIN_CPU; 90603b705cfSriastradh } 90703b705cfSriastradh#endif 90803b705cfSriastradh} 90903b705cfSriastradh 91003b705cfSriastradhstatic bool 91103b705cfSriastradhkgem_bo_is_retained(struct kgem *kgem, struct kgem_bo *bo) 91203b705cfSriastradh{ 91303b705cfSriastradh#if DBG_NO_MADV 91403b705cfSriastradh return true; 91503b705cfSriastradh#else 91603b705cfSriastradh struct drm_i915_gem_madvise madv; 91703b705cfSriastradh 91803b705cfSriastradh if (!bo->purged) 91903b705cfSriastradh return true; 92003b705cfSriastradh 92103b705cfSriastradh VG_CLEAR(madv); 92203b705cfSriastradh madv.handle = bo->handle; 92303b705cfSriastradh madv.madv = I915_MADV_DONTNEED; 9249a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_MADVISE, &madv) == 0) 92503b705cfSriastradh return madv.retained; 92603b705cfSriastradh 92703b705cfSriastradh return false; 92803b705cfSriastradh#endif 92903b705cfSriastradh} 93003b705cfSriastradh 93103b705cfSriastradhstatic bool 93203b705cfSriastradhkgem_bo_clear_purgeable(struct kgem *kgem, struct kgem_bo *bo) 93303b705cfSriastradh{ 93403b705cfSriastradh#if DBG_NO_MADV 93503b705cfSriastradh return true; 93603b705cfSriastradh#else 93703b705cfSriastradh struct drm_i915_gem_madvise madv; 93803b705cfSriastradh 93903b705cfSriastradh assert(bo->purged); 94003b705cfSriastradh 94103b705cfSriastradh VG_CLEAR(madv); 94203b705cfSriastradh madv.handle = bo->handle; 94303b705cfSriastradh madv.madv = I915_MADV_WILLNEED; 9449a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_MADVISE, &madv) == 0) { 94503b705cfSriastradh bo->purged = !madv.retained; 94663ef14f0Smrg kgem->need_purge |= 
!madv.retained && bo->domain != DOMAIN_CPU; 94703b705cfSriastradh return madv.retained; 94803b705cfSriastradh } 94903b705cfSriastradh 95003b705cfSriastradh return false; 95103b705cfSriastradh#endif 95203b705cfSriastradh} 95303b705cfSriastradh 95403b705cfSriastradhstatic void gem_close(int fd, uint32_t handle) 95503b705cfSriastradh{ 95603b705cfSriastradh struct drm_gem_close close; 95703b705cfSriastradh 95803b705cfSriastradh VG_CLEAR(close); 95903b705cfSriastradh close.handle = handle; 9609a906b70Schristos (void)do_ioctl(fd, DRM_IOCTL_GEM_CLOSE, &close); 96103b705cfSriastradh} 96203b705cfSriastradh 96303b705cfSriastradhconstant inline static unsigned long __fls(unsigned long word) 96403b705cfSriastradh{ 96503b705cfSriastradh#if defined(__GNUC__) && (defined(__i386__) || defined(__x86__) || defined(__x86_64__)) 96603b705cfSriastradh asm("bsr %1,%0" 96703b705cfSriastradh : "=r" (word) 96803b705cfSriastradh : "rm" (word)); 96903b705cfSriastradh return word; 97003b705cfSriastradh#else 97103b705cfSriastradh unsigned int v = 0; 97203b705cfSriastradh 97303b705cfSriastradh while (word >>= 1) 97403b705cfSriastradh v++; 97503b705cfSriastradh 97603b705cfSriastradh return v; 97703b705cfSriastradh#endif 97803b705cfSriastradh} 97903b705cfSriastradh 98003b705cfSriastradhconstant inline static int cache_bucket(int num_pages) 98103b705cfSriastradh{ 98203b705cfSriastradh return __fls(num_pages); 98303b705cfSriastradh} 98403b705cfSriastradh 98503b705cfSriastradhstatic struct kgem_bo *__kgem_bo_init(struct kgem_bo *bo, 98603b705cfSriastradh int handle, int num_pages) 98703b705cfSriastradh{ 9889a906b70Schristos DBG(("%s(handle=%d, num_pages=%d)\n", __FUNCTION__, handle, num_pages)); 9899a906b70Schristos 99003b705cfSriastradh assert(num_pages); 99103b705cfSriastradh memset(bo, 0, sizeof(*bo)); 99203b705cfSriastradh 99303b705cfSriastradh bo->refcnt = 1; 99403b705cfSriastradh bo->handle = handle; 99503b705cfSriastradh bo->target_handle = -1; 99603b705cfSriastradh num_pages(bo) = num_pages; 
99703b705cfSriastradh bucket(bo) = cache_bucket(num_pages); 99803b705cfSriastradh bo->reusable = true; 99903b705cfSriastradh bo->domain = DOMAIN_CPU; 100003b705cfSriastradh list_init(&bo->request); 100103b705cfSriastradh list_init(&bo->list); 100203b705cfSriastradh list_init(&bo->vma); 100303b705cfSriastradh 100403b705cfSriastradh return bo; 100503b705cfSriastradh} 100603b705cfSriastradh 100703b705cfSriastradhstatic struct kgem_bo *__kgem_bo_alloc(int handle, int num_pages) 100803b705cfSriastradh{ 100903b705cfSriastradh struct kgem_bo *bo; 101003b705cfSriastradh 101103b705cfSriastradh if (__kgem_freed_bo) { 101203b705cfSriastradh bo = __kgem_freed_bo; 101303b705cfSriastradh __kgem_freed_bo = *(struct kgem_bo **)bo; 101403b705cfSriastradh } else { 101503b705cfSriastradh bo = malloc(sizeof(*bo)); 101603b705cfSriastradh if (bo == NULL) 101703b705cfSriastradh return NULL; 101803b705cfSriastradh } 101903b705cfSriastradh 102003b705cfSriastradh return __kgem_bo_init(bo, handle, num_pages); 102103b705cfSriastradh} 102203b705cfSriastradh 102303b705cfSriastradhstatic struct kgem_request *__kgem_request_alloc(struct kgem *kgem) 102403b705cfSriastradh{ 102503b705cfSriastradh struct kgem_request *rq; 102603b705cfSriastradh 102763ef14f0Smrg if (unlikely(kgem->wedged)) { 102863ef14f0Smrg rq = &kgem->static_request; 102903b705cfSriastradh } else { 103063ef14f0Smrg rq = __kgem_freed_request; 103163ef14f0Smrg if (rq) { 103263ef14f0Smrg __kgem_freed_request = *(struct kgem_request **)rq; 103363ef14f0Smrg } else { 103463ef14f0Smrg rq = malloc(sizeof(*rq)); 103563ef14f0Smrg if (rq == NULL) 103663ef14f0Smrg rq = &kgem->static_request; 103763ef14f0Smrg } 103803b705cfSriastradh } 103903b705cfSriastradh 104003b705cfSriastradh list_init(&rq->buffers); 104103b705cfSriastradh rq->bo = NULL; 104203b705cfSriastradh rq->ring = 0; 104303b705cfSriastradh 104403b705cfSriastradh return rq; 104503b705cfSriastradh} 104603b705cfSriastradh 104703b705cfSriastradhstatic void __kgem_request_free(struct 
kgem_request *rq) 104803b705cfSriastradh{ 104903b705cfSriastradh _list_del(&rq->list); 10509a906b70Schristos if (DBG_NO_MALLOC_CACHE) { 10519a906b70Schristos free(rq); 10529a906b70Schristos } else { 10539a906b70Schristos *(struct kgem_request **)rq = __kgem_freed_request; 10549a906b70Schristos __kgem_freed_request = rq; 10559a906b70Schristos } 105603b705cfSriastradh} 105703b705cfSriastradh 105803b705cfSriastradhstatic struct list *inactive(struct kgem *kgem, int num_pages) 105903b705cfSriastradh{ 106003b705cfSriastradh assert(num_pages < MAX_CACHE_SIZE / PAGE_SIZE); 106103b705cfSriastradh assert(cache_bucket(num_pages) < NUM_CACHE_BUCKETS); 106203b705cfSriastradh return &kgem->inactive[cache_bucket(num_pages)]; 106303b705cfSriastradh} 106403b705cfSriastradh 106503b705cfSriastradhstatic struct list *active(struct kgem *kgem, int num_pages, int tiling) 106603b705cfSriastradh{ 106703b705cfSriastradh assert(num_pages < MAX_CACHE_SIZE / PAGE_SIZE); 106803b705cfSriastradh assert(cache_bucket(num_pages) < NUM_CACHE_BUCKETS); 106903b705cfSriastradh return &kgem->active[cache_bucket(num_pages)][tiling]; 107003b705cfSriastradh} 107103b705cfSriastradh 107203b705cfSriastradhstatic size_t 107303b705cfSriastradhagp_aperture_size(struct pci_device *dev, unsigned gen) 107403b705cfSriastradh{ 107503b705cfSriastradh /* XXX assume that only future chipsets are unknown and follow 107603b705cfSriastradh * the post gen2 PCI layout. 107703b705cfSriastradh */ 107803b705cfSriastradh return dev->regions[gen < 030 ? 
0 : 2].size; 107903b705cfSriastradh} 108003b705cfSriastradh 108103b705cfSriastradhstatic size_t 108203b705cfSriastradhtotal_ram_size(void) 108303b705cfSriastradh{ 108403b705cfSriastradh#ifdef HAVE_STRUCT_SYSINFO_TOTALRAM 108503b705cfSriastradh struct sysinfo info; 108603b705cfSriastradh if (sysinfo(&info) == 0) 108763ef14f0Smrg return (size_t)info.totalram * info.mem_unit; 108803b705cfSriastradh#endif 108903b705cfSriastradh 109003b705cfSriastradh#ifdef _SC_PHYS_PAGES 109163ef14f0Smrg return (size_t)sysconf(_SC_PHYS_PAGES) * sysconf(_SC_PAGE_SIZE); 109203b705cfSriastradh#endif 109303b705cfSriastradh 109403b705cfSriastradh return 0; 109503b705cfSriastradh} 109603b705cfSriastradh 109703b705cfSriastradhstatic unsigned 109803b705cfSriastradhcpu_cache_size__cpuid4(void) 109903b705cfSriastradh{ 11009a906b70Schristos /* Deterministic Cache Parameters (Function 04h)": 110103b705cfSriastradh * When EAX is initialized to a value of 4, the CPUID instruction 110203b705cfSriastradh * returns deterministic cache information in the EAX, EBX, ECX 110303b705cfSriastradh * and EDX registers. This function requires ECX be initialized 110403b705cfSriastradh * with an index which indicates which cache to return information 110503b705cfSriastradh * about. The OS is expected to call this function (CPUID.4) with 110603b705cfSriastradh * ECX = 0, 1, 2, until EAX[4:0] == 0, indicating no more caches. 110703b705cfSriastradh * The order in which the caches are returned is not specified 110803b705cfSriastradh * and may change at Intel's discretion. 
110903b705cfSriastradh * 111003b705cfSriastradh * Calculating the Cache Size in bytes: 111103b705cfSriastradh * = (Ways +1) * (Partitions +1) * (Line Size +1) * (Sets +1) 111203b705cfSriastradh */ 111303b705cfSriastradh 111403b705cfSriastradh unsigned int eax, ebx, ecx, edx; 111503b705cfSriastradh unsigned int llc_size = 0; 11169a906b70Schristos int cnt; 111703b705cfSriastradh 111803b705cfSriastradh if (__get_cpuid_max(BASIC_CPUID, NULL) < 4) 111903b705cfSriastradh return 0; 112003b705cfSriastradh 11219a906b70Schristos cnt = 0; 112203b705cfSriastradh do { 112303b705cfSriastradh unsigned associativity, line_partitions, line_size, sets; 112403b705cfSriastradh 112503b705cfSriastradh __cpuid_count(4, cnt++, eax, ebx, ecx, edx); 112603b705cfSriastradh 112703b705cfSriastradh if ((eax & 0x1f) == 0) 112803b705cfSriastradh break; 112903b705cfSriastradh 113003b705cfSriastradh associativity = ((ebx >> 22) & 0x3ff) + 1; 113103b705cfSriastradh line_partitions = ((ebx >> 12) & 0x3ff) + 1; 113203b705cfSriastradh line_size = (ebx & 0xfff) + 1; 113303b705cfSriastradh sets = ecx + 1; 113403b705cfSriastradh 113503b705cfSriastradh llc_size = associativity * line_partitions * line_size * sets; 113603b705cfSriastradh } while (1); 113703b705cfSriastradh 113803b705cfSriastradh return llc_size; 113903b705cfSriastradh} 114003b705cfSriastradh 114103b705cfSriastradhstatic unsigned 114203b705cfSriastradhcpu_cache_size(void) 114303b705cfSriastradh{ 114403b705cfSriastradh unsigned size; 114503b705cfSriastradh FILE *file; 114603b705cfSriastradh 114703b705cfSriastradh size = cpu_cache_size__cpuid4(); 114803b705cfSriastradh if (size) 114903b705cfSriastradh return size; 115003b705cfSriastradh 115103b705cfSriastradh file = fopen("/proc/cpuinfo", "r"); 115203b705cfSriastradh if (file) { 115303b705cfSriastradh size_t len = 0; 115403b705cfSriastradh char *line = NULL; 115503b705cfSriastradh while (getline(&line, &len, file) != -1) { 115603b705cfSriastradh int kb; 115703b705cfSriastradh if (sscanf(line, 
"cache size : %d KB", &kb) == 1) { 115803b705cfSriastradh /* Paranoid check against gargantuan caches */ 115903b705cfSriastradh if (kb <= 1<<20) 116003b705cfSriastradh size = kb * 1024; 116103b705cfSriastradh break; 116203b705cfSriastradh } 116303b705cfSriastradh } 116403b705cfSriastradh free(line); 116503b705cfSriastradh fclose(file); 116603b705cfSriastradh } 116703b705cfSriastradh 116803b705cfSriastradh if (size == 0) 116903b705cfSriastradh size = 64 * 1024; 117003b705cfSriastradh 117103b705cfSriastradh return size; 117203b705cfSriastradh} 117303b705cfSriastradh 117403b705cfSriastradhstatic int gem_param(struct kgem *kgem, int name) 117503b705cfSriastradh{ 117603b705cfSriastradh drm_i915_getparam_t gp; 117703b705cfSriastradh int v = -1; /* No param uses the sign bit, reserve it for errors */ 117803b705cfSriastradh 117903b705cfSriastradh VG_CLEAR(gp); 118003b705cfSriastradh gp.param = name; 118103b705cfSriastradh gp.value = &v; 11829a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GETPARAM, &gp)) 118303b705cfSriastradh return -1; 118403b705cfSriastradh 118503b705cfSriastradh VG(VALGRIND_MAKE_MEM_DEFINED(&v, sizeof(v))); 118603b705cfSriastradh return v; 118703b705cfSriastradh} 118803b705cfSriastradh 118903b705cfSriastradhstatic bool test_has_execbuffer2(struct kgem *kgem) 119003b705cfSriastradh{ 119103b705cfSriastradh struct drm_i915_gem_execbuffer2 execbuf; 119203b705cfSriastradh 119303b705cfSriastradh memset(&execbuf, 0, sizeof(execbuf)); 119403b705cfSriastradh execbuf.buffer_count = 1; 119503b705cfSriastradh 11969a906b70Schristos return do_ioctl(kgem->fd, 119703b705cfSriastradh DRM_IOCTL_I915_GEM_EXECBUFFER2, 11989a906b70Schristos &execbuf) == -EFAULT; 119903b705cfSriastradh} 120003b705cfSriastradh 120103b705cfSriastradhstatic bool test_has_no_reloc(struct kgem *kgem) 120203b705cfSriastradh{ 120303b705cfSriastradh if (DBG_NO_FAST_RELOC) 120403b705cfSriastradh return false; 120503b705cfSriastradh 120603b705cfSriastradh return gem_param(kgem, 
LOCAL_I915_PARAM_HAS_NO_RELOC) > 0; 120703b705cfSriastradh} 120803b705cfSriastradh 120903b705cfSriastradhstatic bool test_has_handle_lut(struct kgem *kgem) 121003b705cfSriastradh{ 121103b705cfSriastradh if (DBG_NO_HANDLE_LUT) 121203b705cfSriastradh return false; 121303b705cfSriastradh 121403b705cfSriastradh return gem_param(kgem, LOCAL_I915_PARAM_HAS_HANDLE_LUT) > 0; 121503b705cfSriastradh} 121603b705cfSriastradh 121703b705cfSriastradhstatic bool test_has_wt(struct kgem *kgem) 121803b705cfSriastradh{ 121903b705cfSriastradh if (DBG_NO_WT) 122003b705cfSriastradh return false; 122103b705cfSriastradh 122203b705cfSriastradh return gem_param(kgem, LOCAL_I915_PARAM_HAS_WT) > 0; 122303b705cfSriastradh} 122403b705cfSriastradh 122503b705cfSriastradhstatic bool test_has_semaphores_enabled(struct kgem *kgem) 122603b705cfSriastradh{ 122703b705cfSriastradh FILE *file; 122803b705cfSriastradh bool detected = false; 122903b705cfSriastradh int ret; 123003b705cfSriastradh 123103b705cfSriastradh if (DBG_NO_SEMAPHORES) 123203b705cfSriastradh return false; 123303b705cfSriastradh 123403b705cfSriastradh ret = gem_param(kgem, LOCAL_I915_PARAM_HAS_SEMAPHORES); 123503b705cfSriastradh if (ret != -1) 123603b705cfSriastradh return ret > 0; 123703b705cfSriastradh 123803b705cfSriastradh file = fopen("/sys/module/i915/parameters/semaphores", "r"); 123903b705cfSriastradh if (file) { 124003b705cfSriastradh int value; 124103b705cfSriastradh if (fscanf(file, "%d", &value) == 1) 124203b705cfSriastradh detected = value != 0; 124303b705cfSriastradh fclose(file); 124403b705cfSriastradh } 124503b705cfSriastradh 124603b705cfSriastradh return detected; 124703b705cfSriastradh} 124803b705cfSriastradh 124903b705cfSriastradhstatic bool is_hw_supported(struct kgem *kgem, 125003b705cfSriastradh struct pci_device *dev) 125103b705cfSriastradh{ 125203b705cfSriastradh if (DBG_NO_HW) 125303b705cfSriastradh return false; 125403b705cfSriastradh 125503b705cfSriastradh if (!test_has_execbuffer2(kgem)) 
125603b705cfSriastradh return false; 125703b705cfSriastradh 125803b705cfSriastradh if (kgem->gen == (unsigned)-1) /* unknown chipset, assume future gen */ 125903b705cfSriastradh return kgem->has_blt; 126003b705cfSriastradh 126103b705cfSriastradh /* Although pre-855gm the GMCH is fubar, it works mostly. So 126203b705cfSriastradh * let the user decide through "NoAccel" whether or not to risk 126303b705cfSriastradh * hw acceleration. 126403b705cfSriastradh */ 126503b705cfSriastradh 12669a906b70Schristos if (kgem->gen == 060 && dev && dev->revision < 8) { 126703b705cfSriastradh /* pre-production SNB with dysfunctional BLT */ 126803b705cfSriastradh return false; 126903b705cfSriastradh } 127003b705cfSriastradh 127103b705cfSriastradh if (kgem->gen >= 060) /* Only if the kernel supports the BLT ring */ 127203b705cfSriastradh return kgem->has_blt; 127303b705cfSriastradh 127403b705cfSriastradh return true; 127503b705cfSriastradh} 127603b705cfSriastradh 127703b705cfSriastradhstatic bool test_has_relaxed_fencing(struct kgem *kgem) 127803b705cfSriastradh{ 127903b705cfSriastradh if (kgem->gen < 040) { 128003b705cfSriastradh if (DBG_NO_RELAXED_FENCING) 128103b705cfSriastradh return false; 128203b705cfSriastradh 128303b705cfSriastradh return gem_param(kgem, LOCAL_I915_PARAM_HAS_RELAXED_FENCING) > 0; 128403b705cfSriastradh } else 128503b705cfSriastradh return true; 128603b705cfSriastradh} 128703b705cfSriastradh 128863ef14f0Smrgstatic bool test_has_coherent_mmap_gtt(struct kgem *kgem) 128963ef14f0Smrg{ 129063ef14f0Smrg if (DBG_NO_COHERENT_MMAP_GTT) 129163ef14f0Smrg return false; 129263ef14f0Smrg 129363ef14f0Smrg return gem_param(kgem, LOCAL_I915_PARAM_MMAP_GTT_COHERENT) > 0; 129463ef14f0Smrg} 129563ef14f0Smrg 129603b705cfSriastradhstatic bool test_has_llc(struct kgem *kgem) 129703b705cfSriastradh{ 129803b705cfSriastradh int has_llc = -1; 129903b705cfSriastradh 130003b705cfSriastradh if (DBG_NO_LLC) 130103b705cfSriastradh return false; 130203b705cfSriastradh 1303813957e3Ssnj has_llc 
= gem_param(kgem, LOCAL_I915_PARAM_HAS_LLC); 130403b705cfSriastradh if (has_llc == -1) { 130503b705cfSriastradh DBG(("%s: no kernel/drm support for HAS_LLC, assuming support for LLC based on GPU generation\n", __FUNCTION__)); 130603b705cfSriastradh has_llc = kgem->gen >= 060; 130703b705cfSriastradh } 130803b705cfSriastradh 130903b705cfSriastradh return has_llc; 131003b705cfSriastradh} 131103b705cfSriastradh 1312813957e3Ssnjstatic bool test_has_wc_mmap(struct kgem *kgem) 1313813957e3Ssnj{ 1314813957e3Ssnj struct local_i915_gem_mmap2 wc; 1315813957e3Ssnj bool ret; 1316813957e3Ssnj 1317813957e3Ssnj if (DBG_NO_WC_MMAP) 1318813957e3Ssnj return false; 1319813957e3Ssnj 132063ef14f0Smrg /* XXX See https://bugs.freedesktop.org/show_bug.cgi?id=90841 */ 132163ef14f0Smrg if (kgem->gen < 033) 132263ef14f0Smrg return false; 132363ef14f0Smrg 1324813957e3Ssnj if (gem_param(kgem, LOCAL_I915_PARAM_MMAP_VERSION) < 1) 1325813957e3Ssnj return false; 1326813957e3Ssnj 1327813957e3Ssnj VG_CLEAR(wc); 1328813957e3Ssnj wc.handle = gem_create(kgem->fd, 1); 1329813957e3Ssnj wc.offset = 0; 1330813957e3Ssnj wc.size = 4096; 1331813957e3Ssnj wc.flags = I915_MMAP_WC; 1332813957e3Ssnj ret = do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_MMAP_v2, &wc) == 0; 1333813957e3Ssnj gem_close(kgem->fd, wc.handle); 1334813957e3Ssnj 1335813957e3Ssnj return ret; 1336813957e3Ssnj} 1337813957e3Ssnj 133803b705cfSriastradhstatic bool test_has_caching(struct kgem *kgem) 133903b705cfSriastradh{ 134003b705cfSriastradh uint32_t handle; 134103b705cfSriastradh bool ret; 134203b705cfSriastradh 134303b705cfSriastradh if (DBG_NO_CACHE_LEVEL) 134403b705cfSriastradh return false; 134503b705cfSriastradh 134603b705cfSriastradh /* Incoherent blt and sampler hangs the GPU */ 134703b705cfSriastradh if (kgem->gen == 040) 134803b705cfSriastradh return false; 134903b705cfSriastradh 135003b705cfSriastradh handle = gem_create(kgem->fd, 1); 135103b705cfSriastradh if (handle == 0) 135203b705cfSriastradh return false; 135303b705cfSriastradh 
135403b705cfSriastradh ret = gem_set_caching(kgem->fd, handle, UNCACHED); 135503b705cfSriastradh gem_close(kgem->fd, handle); 135603b705cfSriastradh return ret; 135703b705cfSriastradh} 135803b705cfSriastradh 135903b705cfSriastradhstatic bool test_has_userptr(struct kgem *kgem) 136003b705cfSriastradh{ 136163ef14f0Smrg struct local_i915_gem_userptr arg; 136203b705cfSriastradh void *ptr; 136303b705cfSriastradh 136403b705cfSriastradh if (DBG_NO_USERPTR) 136503b705cfSriastradh return false; 136603b705cfSriastradh 136703b705cfSriastradh /* Incoherent blt and sampler hangs the GPU */ 136803b705cfSriastradh if (kgem->gen == 040) 136903b705cfSriastradh return false; 137003b705cfSriastradh 137103b705cfSriastradh if (posix_memalign(&ptr, PAGE_SIZE, PAGE_SIZE)) 137203b705cfSriastradh return false; 137303b705cfSriastradh 137463ef14f0Smrg VG_CLEAR(arg); 137563ef14f0Smrg arg.user_ptr = (uintptr_t)ptr; 137663ef14f0Smrg arg.user_size = PAGE_SIZE; 137763ef14f0Smrg arg.flags = I915_USERPTR_UNSYNCHRONIZED; 137803b705cfSriastradh 137963ef14f0Smrg if (DBG_NO_UNSYNCHRONIZED_USERPTR || 138063ef14f0Smrg do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_USERPTR, &arg)) { 138163ef14f0Smrg arg.flags &= ~I915_USERPTR_UNSYNCHRONIZED; 138263ef14f0Smrg if (do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_USERPTR, &arg)) 138363ef14f0Smrg arg.handle = 0; 138463ef14f0Smrg /* Leak the userptr bo to keep the mmu_notifier alive */ 138563ef14f0Smrg } else { 138663ef14f0Smrg gem_close(kgem->fd, arg.handle); 138763ef14f0Smrg free(ptr); 138863ef14f0Smrg } 138963ef14f0Smrg 139063ef14f0Smrg return arg.handle != 0; 139103b705cfSriastradh} 139203b705cfSriastradh 139303b705cfSriastradhstatic bool test_has_create2(struct kgem *kgem) 139403b705cfSriastradh{ 139503b705cfSriastradh#if defined(USE_CREATE2) 139603b705cfSriastradh struct local_i915_gem_create2 args; 139703b705cfSriastradh 139803b705cfSriastradh if (DBG_NO_CREATE2) 139903b705cfSriastradh return false; 140003b705cfSriastradh 140103b705cfSriastradh memset(&args, 0, 
sizeof(args)); 140203b705cfSriastradh args.size = PAGE_SIZE; 140303b705cfSriastradh args.caching = DISPLAY; 14049a906b70Schristos if (do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_CREATE2, &args) == 0) 140503b705cfSriastradh gem_close(kgem->fd, args.handle); 140603b705cfSriastradh 140703b705cfSriastradh return args.handle != 0; 140803b705cfSriastradh#else 140903b705cfSriastradh return false; 141003b705cfSriastradh#endif 141103b705cfSriastradh} 141203b705cfSriastradh 141363ef14f0Smrgstatic bool test_can_blt_y(struct kgem *kgem) 141403b705cfSriastradh{ 141563ef14f0Smrg struct drm_i915_gem_exec_object2 object; 141663ef14f0Smrg uint32_t batch[] = { 141763ef14f0Smrg#define MI_LOAD_REGISTER_IMM (0x22<<23 | (3-2)) 141863ef14f0Smrg#define BCS_SWCTRL 0x22200 141963ef14f0Smrg#define BCS_SRC_Y (1 << 0) 142063ef14f0Smrg#define BCS_DST_Y (1 << 1) 142163ef14f0Smrg MI_LOAD_REGISTER_IMM, 142263ef14f0Smrg BCS_SWCTRL, 142363ef14f0Smrg (BCS_SRC_Y | BCS_DST_Y) << 16 | (BCS_SRC_Y | BCS_DST_Y), 142463ef14f0Smrg 142563ef14f0Smrg MI_LOAD_REGISTER_IMM, 142663ef14f0Smrg BCS_SWCTRL, 142763ef14f0Smrg (BCS_SRC_Y | BCS_DST_Y) << 16, 142863ef14f0Smrg 142963ef14f0Smrg MI_BATCH_BUFFER_END, 143063ef14f0Smrg 0, 143163ef14f0Smrg }; 143263ef14f0Smrg int ret; 143363ef14f0Smrg 143463ef14f0Smrg if (DBG_NO_BLT_Y) 143503b705cfSriastradh return false; 143603b705cfSriastradh 143763ef14f0Smrg if (kgem->gen < 060) 143863ef14f0Smrg return false; 143963ef14f0Smrg 144063ef14f0Smrg memset(&object, 0, sizeof(object)); 144163ef14f0Smrg object.handle = gem_create(kgem->fd, 1); 144263ef14f0Smrg 144363ef14f0Smrg ret = gem_write(kgem->fd, object.handle, 0, sizeof(batch), batch); 144463ef14f0Smrg if (ret == 0) { 144563ef14f0Smrg struct drm_i915_gem_execbuffer2 execbuf; 144663ef14f0Smrg 144763ef14f0Smrg memset(&execbuf, 0, sizeof(execbuf)); 144863ef14f0Smrg execbuf.buffers_ptr = (uintptr_t)&object; 144963ef14f0Smrg execbuf.buffer_count = 1; 145063ef14f0Smrg execbuf.flags = KGEM_BLT; 145163ef14f0Smrg 145263ef14f0Smrg ret = 
do_ioctl(kgem->fd, 145363ef14f0Smrg DRM_IOCTL_I915_GEM_EXECBUFFER2, 145463ef14f0Smrg &execbuf); 145563ef14f0Smrg } 145663ef14f0Smrg gem_close(kgem->fd, object.handle); 145763ef14f0Smrg 145863ef14f0Smrg return ret == 0; 145903b705cfSriastradh} 146003b705cfSriastradh 146163ef14f0Smrgstatic bool gem_set_tiling(int fd, uint32_t handle, int tiling, int stride) 146203b705cfSriastradh{ 146363ef14f0Smrg struct drm_i915_gem_set_tiling set_tiling; 146463ef14f0Smrg 146563ef14f0Smrg if (DBG_NO_TILING) 146603b705cfSriastradh return false; 146703b705cfSriastradh 146863ef14f0Smrg VG_CLEAR(set_tiling); 146963ef14f0Smrg set_tiling.handle = handle; 147063ef14f0Smrg set_tiling.tiling_mode = tiling; 147163ef14f0Smrg set_tiling.stride = stride; 147263ef14f0Smrg 147363ef14f0Smrg if (ioctl(fd, DRM_IOCTL_I915_GEM_SET_TILING, &set_tiling) == 0) 147463ef14f0Smrg return set_tiling.tiling_mode == tiling; 147563ef14f0Smrg 147663ef14f0Smrg return false; 147703b705cfSriastradh} 147803b705cfSriastradh 147963ef14f0Smrgstatic bool test_can_scanout_y(struct kgem *kgem) 148003b705cfSriastradh{ 148163ef14f0Smrg struct drm_mode_fb_cmd arg; 148263ef14f0Smrg bool ret = false; 148363ef14f0Smrg 148463ef14f0Smrg if (DBG_NO_SCANOUT_Y) 148563ef14f0Smrg return false; 148663ef14f0Smrg 148763ef14f0Smrg VG_CLEAR(arg); 148863ef14f0Smrg arg.width = 32; 148963ef14f0Smrg arg.height = 32; 149063ef14f0Smrg arg.pitch = 4*32; 149163ef14f0Smrg arg.bpp = 32; 149263ef14f0Smrg arg.depth = 24; 149363ef14f0Smrg arg.handle = gem_create(kgem->fd, 1); 149463ef14f0Smrg 149563ef14f0Smrg if (gem_set_tiling(kgem->fd, arg.handle, I915_TILING_Y, arg.pitch)) 149663ef14f0Smrg ret = do_ioctl(kgem->fd, DRM_IOCTL_MODE_ADDFB, &arg) == 0; 149763ef14f0Smrg if (!ret) { 149863ef14f0Smrg struct local_mode_fb_cmd2 { 149963ef14f0Smrg uint32_t fb_id; 150063ef14f0Smrg uint32_t width, height; 150163ef14f0Smrg uint32_t pixel_format; 150263ef14f0Smrg uint32_t flags; 150363ef14f0Smrg 150463ef14f0Smrg uint32_t handles[4]; 150563ef14f0Smrg uint32_t 
pitches[4]; 150663ef14f0Smrg uint32_t offsets[4]; 150763ef14f0Smrg uint64_t modifiers[4]; 150863ef14f0Smrg } f; 150963ef14f0Smrg#define LOCAL_IOCTL_MODE_ADDFB2 DRM_IOWR(0xb8, struct local_mode_fb_cmd2) 151063ef14f0Smrg memset(&f, 0, sizeof(f)); 151163ef14f0Smrg f.width = arg.width; 151263ef14f0Smrg f.height = arg.height; 151363ef14f0Smrg f.handles[0] = arg.handle; 151463ef14f0Smrg f.pitches[0] = arg.pitch; 151563ef14f0Smrg f.modifiers[0] = (uint64_t)1 << 56 | 2; /* MOD_Y_TILED */ 151663ef14f0Smrg f.pixel_format = 'X' | 'R' << 8 | '2' << 16 | '4' << 24; /* XRGB8888 */ 151763ef14f0Smrg f.flags = 1 << 1; /* + modifier */ 151863ef14f0Smrg if (drmIoctl(kgem->fd, LOCAL_IOCTL_MODE_ADDFB2, &f) == 0) { 151963ef14f0Smrg ret = true; 152063ef14f0Smrg arg.fb_id = f.fb_id; 152163ef14f0Smrg } 152263ef14f0Smrg } 152363ef14f0Smrg do_ioctl(kgem->fd, DRM_IOCTL_MODE_RMFB, &arg.fb_id); 152463ef14f0Smrg gem_close(kgem->fd, arg.handle); 152563ef14f0Smrg 152663ef14f0Smrg return ret; 152703b705cfSriastradh} 152803b705cfSriastradh 152963ef14f0Smrgstatic bool test_has_dirtyfb(struct kgem *kgem) 15309a906b70Schristos{ 153163ef14f0Smrg struct drm_mode_fb_cmd create; 153263ef14f0Smrg bool ret = false; 15339a906b70Schristos 153463ef14f0Smrg if (DBG_NO_DIRTYFB) 153563ef14f0Smrg return false; 15369a906b70Schristos 153763ef14f0Smrg VG_CLEAR(create); 153863ef14f0Smrg create.width = 32; 153963ef14f0Smrg create.height = 32; 154063ef14f0Smrg create.pitch = 4*32; 154163ef14f0Smrg create.bpp = 24; 154263ef14f0Smrg create.depth = 32; /* {bpp:24, depth:32} -> x8r8g8b8 */ 154363ef14f0Smrg create.handle = gem_create(kgem->fd, 1); 154463ef14f0Smrg if (create.handle == 0) 154563ef14f0Smrg return false; 15469a906b70Schristos 154763ef14f0Smrg if (drmIoctl(kgem->fd, DRM_IOCTL_MODE_ADDFB, &create) == 0) { 154863ef14f0Smrg struct drm_mode_fb_dirty_cmd dirty; 154963ef14f0Smrg 155063ef14f0Smrg memset(&dirty, 0, sizeof(dirty)); 155163ef14f0Smrg dirty.fb_id = create.fb_id; 155263ef14f0Smrg ret = drmIoctl(kgem->fd, 
155363ef14f0Smrg DRM_IOCTL_MODE_DIRTYFB, 155463ef14f0Smrg &dirty) == 0; 155563ef14f0Smrg 155663ef14f0Smrg /* XXX There may be multiple levels of DIRTYFB, depending on 155763ef14f0Smrg * whether the kernel thinks tracking dirty regions is 155863ef14f0Smrg * beneficial vs flagging the whole fb as dirty. 155963ef14f0Smrg */ 156063ef14f0Smrg 156163ef14f0Smrg drmIoctl(kgem->fd, 156263ef14f0Smrg DRM_IOCTL_MODE_RMFB, 156363ef14f0Smrg &create.fb_id); 15649a906b70Schristos } 156563ef14f0Smrg gem_close(kgem->fd, create.handle); 15669a906b70Schristos 156763ef14f0Smrg return ret; 15689a906b70Schristos} 15699a906b70Schristos 157063ef14f0Smrgstatic bool test_has_secure_batches(struct kgem *kgem) 15719a906b70Schristos{ 157263ef14f0Smrg if (DBG_NO_SECURE_BATCHES) 157363ef14f0Smrg return false; 15749a906b70Schristos 157563ef14f0Smrg return gem_param(kgem, LOCAL_I915_PARAM_HAS_SECURE_BATCHES) > 0; 157663ef14f0Smrg} 15779a906b70Schristos 157863ef14f0Smrgstatic bool test_has_pinned_batches(struct kgem *kgem) 157963ef14f0Smrg{ 158063ef14f0Smrg if (DBG_NO_PINNED_BATCHES) 158163ef14f0Smrg return false; 15829a906b70Schristos 158363ef14f0Smrg return gem_param(kgem, LOCAL_I915_PARAM_HAS_PINNED_BATCHES) > 0; 15849a906b70Schristos} 15859a906b70Schristos 158603b705cfSriastradhstatic bool kgem_init_pinned_batches(struct kgem *kgem) 158703b705cfSriastradh{ 158803b705cfSriastradh int count[2] = { 16, 4 }; 158903b705cfSriastradh int size[2] = { 1, 4 }; 159063ef14f0Smrg int ret = 0; 159103b705cfSriastradh int n, i; 159203b705cfSriastradh 159363ef14f0Smrg if (unlikely(kgem->wedged)) 159403b705cfSriastradh return true; 159503b705cfSriastradh 159603b705cfSriastradh for (n = 0; n < ARRAY_SIZE(count); n++) { 159703b705cfSriastradh for (i = 0; i < count[n]; i++) { 159803b705cfSriastradh struct drm_i915_gem_pin pin; 159903b705cfSriastradh struct kgem_bo *bo; 160003b705cfSriastradh 160103b705cfSriastradh VG_CLEAR(pin); 160203b705cfSriastradh 160303b705cfSriastradh pin.handle = gem_create(kgem->fd, 
size[n]); 160403b705cfSriastradh if (pin.handle == 0) 160503b705cfSriastradh goto err; 160603b705cfSriastradh 160703b705cfSriastradh DBG(("%s: new handle=%d, num_pages=%d\n", 160803b705cfSriastradh __FUNCTION__, pin.handle, size[n])); 160903b705cfSriastradh 161003b705cfSriastradh bo = __kgem_bo_alloc(pin.handle, size[n]); 161103b705cfSriastradh if (bo == NULL) { 161203b705cfSriastradh gem_close(kgem->fd, pin.handle); 161303b705cfSriastradh goto err; 161403b705cfSriastradh } 161503b705cfSriastradh 161603b705cfSriastradh pin.alignment = 0; 161763ef14f0Smrg ret = do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_PIN, &pin); 161863ef14f0Smrg if (ret) { 161903b705cfSriastradh gem_close(kgem->fd, pin.handle); 16209a906b70Schristos free(bo); 162103b705cfSriastradh goto err; 162203b705cfSriastradh } 162303b705cfSriastradh bo->presumed_offset = pin.offset; 162403b705cfSriastradh debug_alloc__bo(kgem, bo); 162503b705cfSriastradh list_add(&bo->list, &kgem->pinned_batches[n]); 162603b705cfSriastradh } 162703b705cfSriastradh } 162803b705cfSriastradh 162903b705cfSriastradh return true; 163003b705cfSriastradh 163103b705cfSriastradherr: 163203b705cfSriastradh for (n = 0; n < ARRAY_SIZE(kgem->pinned_batches); n++) { 163303b705cfSriastradh while (!list_is_empty(&kgem->pinned_batches[n])) { 163403b705cfSriastradh kgem_bo_destroy(kgem, 163503b705cfSriastradh list_first_entry(&kgem->pinned_batches[n], 163603b705cfSriastradh struct kgem_bo, list)); 163703b705cfSriastradh } 163803b705cfSriastradh } 163903b705cfSriastradh 164063ef14f0Smrg /* If we fail to pin some memory for 830gm/845g, we need to disable 164163ef14f0Smrg * acceleration as otherwise the machine will eventually fail. However, 164263ef14f0Smrg * the kernel started arbitrarily rejecting PIN, so hope for the best 164363ef14f0Smrg * if the ioctl no longer works. 
164463ef14f0Smrg */ 164563ef14f0Smrg if (ret != -ENODEV && kgem->gen == 020) 164663ef14f0Smrg return false; 164763ef14f0Smrg 164863ef14f0Smrg kgem->has_pinned_batches = false; 164963ef14f0Smrg 165003b705cfSriastradh /* For simplicity populate the lists with a single unpinned bo */ 165103b705cfSriastradh for (n = 0; n < ARRAY_SIZE(count); n++) { 165203b705cfSriastradh struct kgem_bo *bo; 165303b705cfSriastradh uint32_t handle; 165403b705cfSriastradh 165503b705cfSriastradh handle = gem_create(kgem->fd, size[n]); 165603b705cfSriastradh if (handle == 0) 165763ef14f0Smrg return false; 165803b705cfSriastradh 165903b705cfSriastradh bo = __kgem_bo_alloc(handle, size[n]); 166003b705cfSriastradh if (bo == NULL) { 166103b705cfSriastradh gem_close(kgem->fd, handle); 166263ef14f0Smrg return false; 166303b705cfSriastradh } 166403b705cfSriastradh 166503b705cfSriastradh debug_alloc__bo(kgem, bo); 166603b705cfSriastradh list_add(&bo->list, &kgem->pinned_batches[n]); 166703b705cfSriastradh } 166863ef14f0Smrg return true; 166903b705cfSriastradh} 167003b705cfSriastradh 167103b705cfSriastradhstatic void kgem_init_swizzling(struct kgem *kgem) 167203b705cfSriastradh{ 1673813957e3Ssnj struct local_i915_gem_get_tiling_v2 { 1674813957e3Ssnj uint32_t handle; 1675813957e3Ssnj uint32_t tiling_mode; 1676813957e3Ssnj uint32_t swizzle_mode; 1677813957e3Ssnj uint32_t phys_swizzle_mode; 1678813957e3Ssnj } tiling; 1679813957e3Ssnj#define LOCAL_IOCTL_I915_GEM_GET_TILING DRM_IOWR (DRM_COMMAND_BASE + DRM_I915_GEM_GET_TILING, struct local_i915_gem_get_tiling_v2) 168003b705cfSriastradh 168163ef14f0Smrg memset(&tiling, 0, sizeof(tiling)); 168203b705cfSriastradh tiling.handle = gem_create(kgem->fd, 1); 168303b705cfSriastradh if (!tiling.handle) 168403b705cfSriastradh return; 168503b705cfSriastradh 168603b705cfSriastradh if (!gem_set_tiling(kgem->fd, tiling.handle, I915_TILING_X, 512)) 168703b705cfSriastradh goto out; 168803b705cfSriastradh 1689813957e3Ssnj if (do_ioctl(kgem->fd, 
LOCAL_IOCTL_I915_GEM_GET_TILING, &tiling)) 1690813957e3Ssnj goto out; 1691813957e3Ssnj 169263ef14f0Smrg DBG(("%s: swizzle_mode=%d, phys_swizzle_mode=%d\n", 169363ef14f0Smrg __FUNCTION__, tiling.swizzle_mode, tiling.phys_swizzle_mode)); 169463ef14f0Smrg 169563ef14f0Smrg kgem->can_fence = 169663ef14f0Smrg !DBG_NO_TILING && 169763ef14f0Smrg tiling.swizzle_mode != I915_BIT_6_SWIZZLE_UNKNOWN; 169863ef14f0Smrg 169963ef14f0Smrg if (kgem->gen < 050 && tiling.phys_swizzle_mode != tiling.swizzle_mode) 170003b705cfSriastradh goto out; 170103b705cfSriastradh 170263ef14f0Smrg if (!DBG_NO_DETILING) 170363ef14f0Smrg choose_memcpy_tiled_x(kgem, 170463ef14f0Smrg tiling.swizzle_mode, 170563ef14f0Smrg __to_sna(kgem)->cpu_features); 170603b705cfSriastradhout: 170703b705cfSriastradh gem_close(kgem->fd, tiling.handle); 170863ef14f0Smrg DBG(("%s: can fence?=%d\n", __FUNCTION__, kgem->can_fence)); 170903b705cfSriastradh} 171003b705cfSriastradh 1711813957e3Ssnjstatic void kgem_fixup_relocs(struct kgem *kgem, struct kgem_bo *bo, int shrink) 1712813957e3Ssnj{ 1713813957e3Ssnj int n; 1714813957e3Ssnj 1715813957e3Ssnj bo->target_handle = kgem->has_handle_lut ? kgem->nexec : bo->handle; 1716813957e3Ssnj 1717813957e3Ssnj assert(kgem->nreloc__self <= 256); 1718813957e3Ssnj if (kgem->nreloc__self == 0) 1719813957e3Ssnj return; 1720813957e3Ssnj 1721813957e3Ssnj DBG(("%s: fixing up %d%s self-relocations to handle=%p, presumed-offset=%llx\n", 1722813957e3Ssnj __FUNCTION__, kgem->nreloc__self, 1723813957e3Ssnj kgem->nreloc__self == 256 ? 
"+" : "", 1724813957e3Ssnj bo->handle, (long long)bo->presumed_offset)); 1725813957e3Ssnj for (n = 0; n < kgem->nreloc__self; n++) { 1726813957e3Ssnj int i = kgem->reloc__self[n]; 172763ef14f0Smrg uint64_t addr; 1728813957e3Ssnj 1729813957e3Ssnj assert(kgem->reloc[i].target_handle == ~0U); 1730813957e3Ssnj kgem->reloc[i].target_handle = bo->target_handle; 1731813957e3Ssnj kgem->reloc[i].presumed_offset = bo->presumed_offset; 1732813957e3Ssnj 1733813957e3Ssnj if (kgem->reloc[i].read_domains == I915_GEM_DOMAIN_INSTRUCTION) { 1734813957e3Ssnj DBG(("%s: moving base of self-reloc[%d:%d] %d -> %d\n", 1735813957e3Ssnj __FUNCTION__, n, i, 1736813957e3Ssnj kgem->reloc[i].delta, 1737813957e3Ssnj kgem->reloc[i].delta - shrink)); 1738813957e3Ssnj 1739813957e3Ssnj kgem->reloc[i].delta -= shrink; 1740813957e3Ssnj } 174163ef14f0Smrg addr = (int)kgem->reloc[i].delta + bo->presumed_offset; 174263ef14f0Smrg kgem->batch[kgem->reloc[i].offset/sizeof(uint32_t)] = addr; 174363ef14f0Smrg if (kgem->gen >= 0100) 174463ef14f0Smrg kgem->batch[kgem->reloc[i].offset/sizeof(uint32_t) + 1] = addr >> 32; 1745813957e3Ssnj } 1746813957e3Ssnj 1747813957e3Ssnj if (n == 256) { 1748813957e3Ssnj for (n = kgem->reloc__self[255]; n < kgem->nreloc; n++) { 1749813957e3Ssnj if (kgem->reloc[n].target_handle == ~0U) { 175063ef14f0Smrg uint64_t addr; 175163ef14f0Smrg 1752813957e3Ssnj kgem->reloc[n].target_handle = bo->target_handle; 1753813957e3Ssnj kgem->reloc[n].presumed_offset = bo->presumed_offset; 1754813957e3Ssnj 1755813957e3Ssnj if (kgem->reloc[n].read_domains == I915_GEM_DOMAIN_INSTRUCTION) { 1756813957e3Ssnj DBG(("%s: moving base of reloc[%d] %d -> %d\n", 1757813957e3Ssnj __FUNCTION__, n, 1758813957e3Ssnj kgem->reloc[n].delta, 1759813957e3Ssnj kgem->reloc[n].delta - shrink)); 1760813957e3Ssnj kgem->reloc[n].delta -= shrink; 1761813957e3Ssnj } 176263ef14f0Smrg 176363ef14f0Smrg addr = (int)kgem->reloc[n].delta + bo->presumed_offset; 176463ef14f0Smrg kgem->batch[kgem->reloc[n].offset/sizeof(uint32_t)] = 
addr; 176563ef14f0Smrg if (kgem->gen >= 0100) 176663ef14f0Smrg kgem->batch[kgem->reloc[n].offset/sizeof(uint32_t) + 1] = addr >> 32; 1767813957e3Ssnj } 1768813957e3Ssnj } 1769813957e3Ssnj } 1770813957e3Ssnj 1771813957e3Ssnj if (shrink) { 1772813957e3Ssnj DBG(("%s: shrinking by %d\n", __FUNCTION__, shrink)); 1773813957e3Ssnj for (n = 0; n < kgem->nreloc; n++) { 1774813957e3Ssnj if (kgem->reloc[n].offset >= sizeof(uint32_t)*kgem->nbatch) 1775813957e3Ssnj kgem->reloc[n].offset -= shrink; 1776813957e3Ssnj } 1777813957e3Ssnj } 1778813957e3Ssnj} 1779813957e3Ssnj 178063ef14f0Smrgstatic int kgem_bo_wait(struct kgem *kgem, struct kgem_bo *bo) 178163ef14f0Smrg{ 178263ef14f0Smrg struct local_i915_gem_wait { 178363ef14f0Smrg uint32_t handle; 178463ef14f0Smrg uint32_t flags; 178563ef14f0Smrg int64_t timeout; 178663ef14f0Smrg } wait; 178763ef14f0Smrg#define LOCAL_I915_GEM_WAIT 0x2c 178863ef14f0Smrg#define LOCAL_IOCTL_I915_GEM_WAIT DRM_IOWR(DRM_COMMAND_BASE + LOCAL_I915_GEM_WAIT, struct local_i915_gem_wait) 178963ef14f0Smrg int ret; 179063ef14f0Smrg 179163ef14f0Smrg DBG(("%s: waiting for handle=%d\n", __FUNCTION__, bo->handle)); 179263ef14f0Smrg if (bo->rq == NULL) 179363ef14f0Smrg return 0; 179463ef14f0Smrg 179563ef14f0Smrg VG_CLEAR(wait); 179663ef14f0Smrg wait.handle = bo->handle; 179763ef14f0Smrg wait.flags = 0; 179863ef14f0Smrg wait.timeout = -1; 179963ef14f0Smrg ret = do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_WAIT, &wait); 180063ef14f0Smrg if (ret) { 180163ef14f0Smrg struct drm_i915_gem_set_domain set_domain; 180263ef14f0Smrg 180363ef14f0Smrg VG_CLEAR(set_domain); 180463ef14f0Smrg set_domain.handle = bo->handle; 180563ef14f0Smrg set_domain.read_domains = I915_GEM_DOMAIN_GTT; 180663ef14f0Smrg set_domain.write_domain = I915_GEM_DOMAIN_GTT; 180763ef14f0Smrg ret = do_ioctl(kgem->fd, 180863ef14f0Smrg DRM_IOCTL_I915_GEM_SET_DOMAIN, 180963ef14f0Smrg &set_domain); 181063ef14f0Smrg } 181163ef14f0Smrg 181263ef14f0Smrg if (ret == 0) 181363ef14f0Smrg __kgem_retire_requests_upto(kgem, bo); 
181463ef14f0Smrg 181563ef14f0Smrg return ret; 181663ef14f0Smrg} 181763ef14f0Smrg 1818813957e3Ssnjstatic struct kgem_bo *kgem_new_batch(struct kgem *kgem) 1819813957e3Ssnj{ 1820813957e3Ssnj struct kgem_bo *last; 1821813957e3Ssnj unsigned flags; 1822813957e3Ssnj 1823813957e3Ssnj last = kgem->batch_bo; 1824813957e3Ssnj if (last) { 1825813957e3Ssnj kgem_fixup_relocs(kgem, last, 0); 1826813957e3Ssnj kgem->batch = NULL; 1827813957e3Ssnj } 1828813957e3Ssnj 1829813957e3Ssnj if (kgem->batch) { 1830813957e3Ssnj assert(last == NULL); 1831813957e3Ssnj return NULL; 1832813957e3Ssnj } 1833813957e3Ssnj 1834813957e3Ssnj flags = CREATE_CPU_MAP | CREATE_NO_THROTTLE; 1835813957e3Ssnj if (!kgem->has_llc) 1836813957e3Ssnj flags |= CREATE_UNCACHED; 1837813957e3Ssnj 183863ef14f0Smrgrestart: 1839813957e3Ssnj kgem->batch_bo = kgem_create_linear(kgem, 1840813957e3Ssnj sizeof(uint32_t)*kgem->batch_size, 1841813957e3Ssnj flags); 1842813957e3Ssnj if (kgem->batch_bo) 1843813957e3Ssnj kgem->batch = kgem_bo_map__cpu(kgem, kgem->batch_bo); 1844813957e3Ssnj if (kgem->batch == NULL) { 184563ef14f0Smrg int ring = kgem->ring == KGEM_BLT; 184663ef14f0Smrg assert(ring < ARRAY_SIZE(kgem->requests)); 184763ef14f0Smrg 1848813957e3Ssnj if (kgem->batch_bo) { 1849813957e3Ssnj kgem_bo_destroy(kgem, kgem->batch_bo); 1850813957e3Ssnj kgem->batch_bo = NULL; 1851813957e3Ssnj } 1852813957e3Ssnj 185363ef14f0Smrg if (!list_is_empty(&kgem->requests[ring])) { 185463ef14f0Smrg struct kgem_request *rq; 185563ef14f0Smrg 185663ef14f0Smrg rq = list_first_entry(&kgem->requests[ring], 185763ef14f0Smrg struct kgem_request, list); 185863ef14f0Smrg assert(rq->ring == ring); 185963ef14f0Smrg assert(rq->bo); 186063ef14f0Smrg assert(RQ(rq->bo->rq) == rq); 186163ef14f0Smrg if (kgem_bo_wait(kgem, rq->bo) == 0) 186263ef14f0Smrg goto restart; 186363ef14f0Smrg } 186463ef14f0Smrg 186563ef14f0Smrg if (flags & CREATE_NO_THROTTLE) { 186663ef14f0Smrg flags &= ~CREATE_NO_THROTTLE; 186763ef14f0Smrg if (kgem_cleanup_cache(kgem)) 
186863ef14f0Smrg goto restart; 186963ef14f0Smrg } 187063ef14f0Smrg 187163ef14f0Smrg DBG(("%s: unable to map batch bo, mallocing(size=%d)\n", 187263ef14f0Smrg __FUNCTION__, sizeof(uint32_t)*kgem->batch_size)); 1873813957e3Ssnj if (posix_memalign((void **)&kgem->batch, PAGE_SIZE, 1874813957e3Ssnj ALIGN(sizeof(uint32_t) * kgem->batch_size, PAGE_SIZE))) { 1875813957e3Ssnj ERR(("%s: batch allocation failed, disabling acceleration\n", __FUNCTION__)); 1876813957e3Ssnj __kgem_set_wedged(kgem); 1877813957e3Ssnj } 1878813957e3Ssnj } else { 1879813957e3Ssnj DBG(("%s: allocated and mapped batch handle=%d [size=%d]\n", 1880813957e3Ssnj __FUNCTION__, kgem->batch_bo->handle, 1881813957e3Ssnj sizeof(uint32_t)*kgem->batch_size)); 1882813957e3Ssnj kgem_bo_sync__cpu(kgem, kgem->batch_bo); 1883813957e3Ssnj } 1884813957e3Ssnj 1885813957e3Ssnj DBG(("%s: using last batch handle=%d\n", 1886813957e3Ssnj __FUNCTION__, last ? last->handle : 0)); 1887813957e3Ssnj return last; 1888813957e3Ssnj} 188903b705cfSriastradh 189063ef14f0Smrgstatic void 189163ef14f0Smrgno_retire(struct kgem *kgem) 189263ef14f0Smrg{ 189363ef14f0Smrg (void)kgem; 189463ef14f0Smrg} 189563ef14f0Smrg 189663ef14f0Smrgstatic void 189763ef14f0Smrgno_expire(struct kgem *kgem) 189863ef14f0Smrg{ 189963ef14f0Smrg (void)kgem; 190063ef14f0Smrg} 190163ef14f0Smrg 190263ef14f0Smrgstatic void 190363ef14f0Smrgno_context_switch(struct kgem *kgem, int new_mode) 190463ef14f0Smrg{ 190563ef14f0Smrg (void)kgem; 190663ef14f0Smrg (void)new_mode; 190763ef14f0Smrg} 190863ef14f0Smrg 190963ef14f0Smrgstatic uint64_t get_gtt_size(int fd) 191003b705cfSriastradh{ 191103b705cfSriastradh struct drm_i915_gem_get_aperture aperture; 191263ef14f0Smrg struct local_i915_gem_context_param { 191363ef14f0Smrg uint32_t context; 191463ef14f0Smrg uint32_t size; 191563ef14f0Smrg uint64_t param; 191663ef14f0Smrg#define LOCAL_CONTEXT_PARAM_BAN_PERIOD 0x1 191763ef14f0Smrg#define LOCAL_CONTEXT_PARAM_NO_ZEROMAP 0x2 191863ef14f0Smrg#define LOCAL_CONTEXT_PARAM_GTT_SIZE 0x3 
191963ef14f0Smrg uint64_t value; 192063ef14f0Smrg } p; 192163ef14f0Smrg#define LOCAL_I915_GEM_CONTEXT_GETPARAM 0x34 192263ef14f0Smrg#define LOCAL_IOCTL_I915_GEM_CONTEXT_GETPARAM DRM_IOWR (DRM_COMMAND_BASE + LOCAL_I915_GEM_CONTEXT_GETPARAM, struct local_i915_gem_context_param) 192363ef14f0Smrg 192463ef14f0Smrg memset(&aperture, 0, sizeof(aperture)); 192563ef14f0Smrg 192663ef14f0Smrg memset(&p, 0, sizeof(p)); 192763ef14f0Smrg p.param = LOCAL_CONTEXT_PARAM_GTT_SIZE; 192863ef14f0Smrg if (drmIoctl(fd, LOCAL_IOCTL_I915_GEM_CONTEXT_GETPARAM, &p) == 0) 192963ef14f0Smrg aperture.aper_size = p.value; 193063ef14f0Smrg if (aperture.aper_size == 0) 193163ef14f0Smrg (void)drmIoctl(fd, DRM_IOCTL_I915_GEM_GET_APERTURE, &aperture); 193263ef14f0Smrg if (aperture.aper_size == 0) 193363ef14f0Smrg aperture.aper_size = 64*1024*1024; 193463ef14f0Smrg 193563ef14f0Smrg DBG(("%s: aperture size %lld, available now %lld\n", 193663ef14f0Smrg __FUNCTION__, 193763ef14f0Smrg (long long)aperture.aper_size, 193863ef14f0Smrg (long long)aperture.aper_available_size)); 193963ef14f0Smrg 194063ef14f0Smrg /* clamp aperture to uint32_t for simplicity */ 194163ef14f0Smrg if (aperture.aper_size > 0xc0000000) 194263ef14f0Smrg aperture.aper_size = 0xc0000000; 194363ef14f0Smrg 194463ef14f0Smrg return aperture.aper_size; 194563ef14f0Smrg} 194663ef14f0Smrg 194763ef14f0Smrgvoid kgem_init(struct kgem *kgem, int fd, struct pci_device *dev, unsigned gen) 194863ef14f0Smrg{ 194903b705cfSriastradh size_t totalram; 195003b705cfSriastradh unsigned half_gpu_max; 195103b705cfSriastradh unsigned int i, j; 195263ef14f0Smrg uint64_t gtt_size; 195303b705cfSriastradh 195403b705cfSriastradh DBG(("%s: fd=%d, gen=%d\n", __FUNCTION__, fd, gen)); 195503b705cfSriastradh 195603b705cfSriastradh kgem->fd = fd; 195703b705cfSriastradh kgem->gen = gen; 195803b705cfSriastradh 195963ef14f0Smrg kgem->retire = no_retire; 196063ef14f0Smrg kgem->expire = no_expire; 196163ef14f0Smrg kgem->context_switch = no_context_switch; 196263ef14f0Smrg 
196303b705cfSriastradh list_init(&kgem->requests[0]); 196403b705cfSriastradh list_init(&kgem->requests[1]); 196503b705cfSriastradh list_init(&kgem->batch_buffers); 196603b705cfSriastradh list_init(&kgem->active_buffers); 196703b705cfSriastradh list_init(&kgem->flushing); 196803b705cfSriastradh list_init(&kgem->large); 196903b705cfSriastradh list_init(&kgem->large_inactive); 197003b705cfSriastradh list_init(&kgem->snoop); 197103b705cfSriastradh list_init(&kgem->scanout); 197203b705cfSriastradh for (i = 0; i < ARRAY_SIZE(kgem->pinned_batches); i++) 197303b705cfSriastradh list_init(&kgem->pinned_batches[i]); 197403b705cfSriastradh for (i = 0; i < ARRAY_SIZE(kgem->inactive); i++) 197503b705cfSriastradh list_init(&kgem->inactive[i]); 197603b705cfSriastradh for (i = 0; i < ARRAY_SIZE(kgem->active); i++) { 197703b705cfSriastradh for (j = 0; j < ARRAY_SIZE(kgem->active[i]); j++) 197803b705cfSriastradh list_init(&kgem->active[i][j]); 197903b705cfSriastradh } 198003b705cfSriastradh for (i = 0; i < ARRAY_SIZE(kgem->vma); i++) { 198103b705cfSriastradh for (j = 0; j < ARRAY_SIZE(kgem->vma[i].inactive); j++) 198203b705cfSriastradh list_init(&kgem->vma[i].inactive[j]); 198303b705cfSriastradh } 198403b705cfSriastradh kgem->vma[MAP_GTT].count = -MAX_GTT_VMA_CACHE; 198503b705cfSriastradh kgem->vma[MAP_CPU].count = -MAX_CPU_VMA_CACHE; 198603b705cfSriastradh 198703b705cfSriastradh kgem->has_blt = gem_param(kgem, LOCAL_I915_PARAM_HAS_BLT) > 0; 198803b705cfSriastradh DBG(("%s: has BLT ring? %d\n", __FUNCTION__, 198903b705cfSriastradh kgem->has_blt)); 199003b705cfSriastradh 199103b705cfSriastradh kgem->has_relaxed_delta = 199203b705cfSriastradh gem_param(kgem, LOCAL_I915_PARAM_HAS_RELAXED_DELTA) > 0; 199303b705cfSriastradh DBG(("%s: has relaxed delta? %d\n", __FUNCTION__, 199403b705cfSriastradh kgem->has_relaxed_delta)); 199503b705cfSriastradh 199603b705cfSriastradh kgem->has_relaxed_fencing = test_has_relaxed_fencing(kgem); 199703b705cfSriastradh DBG(("%s: has relaxed fencing? 
%d\n", __FUNCTION__, 199803b705cfSriastradh kgem->has_relaxed_fencing)); 199903b705cfSriastradh 200063ef14f0Smrg kgem->has_coherent_mmap_gtt = test_has_coherent_mmap_gtt(kgem); 200163ef14f0Smrg DBG(("%s: has coherent writes into GTT maps? %d\n", __FUNCTION__, 200263ef14f0Smrg kgem->has_coherent_mmap_gtt)); 200363ef14f0Smrg 200403b705cfSriastradh kgem->has_llc = test_has_llc(kgem); 200503b705cfSriastradh DBG(("%s: has shared last-level-cache? %d\n", __FUNCTION__, 200603b705cfSriastradh kgem->has_llc)); 200703b705cfSriastradh 200803b705cfSriastradh kgem->has_wt = test_has_wt(kgem); 200903b705cfSriastradh DBG(("%s: has write-through caching for scanouts? %d\n", __FUNCTION__, 201003b705cfSriastradh kgem->has_wt)); 201103b705cfSriastradh 2012813957e3Ssnj kgem->has_wc_mmap = test_has_wc_mmap(kgem); 2013813957e3Ssnj DBG(("%s: has wc-mmapping? %d\n", __FUNCTION__, 2014813957e3Ssnj kgem->has_wc_mmap)); 2015813957e3Ssnj 201603b705cfSriastradh kgem->has_caching = test_has_caching(kgem); 201703b705cfSriastradh DBG(("%s: has set-cache-level? %d\n", __FUNCTION__, 201803b705cfSriastradh kgem->has_caching)); 201903b705cfSriastradh 202003b705cfSriastradh kgem->has_userptr = test_has_userptr(kgem); 202103b705cfSriastradh DBG(("%s: has userptr? %d\n", __FUNCTION__, 202203b705cfSriastradh kgem->has_userptr)); 202303b705cfSriastradh 202403b705cfSriastradh kgem->has_create2 = test_has_create2(kgem); 202503b705cfSriastradh DBG(("%s: has create2? %d\n", __FUNCTION__, 202603b705cfSriastradh kgem->has_create2)); 202703b705cfSriastradh 202803b705cfSriastradh kgem->has_no_reloc = test_has_no_reloc(kgem); 202903b705cfSriastradh DBG(("%s: has no-reloc? %d\n", __FUNCTION__, 203003b705cfSriastradh kgem->has_no_reloc)); 203103b705cfSriastradh 203203b705cfSriastradh kgem->has_handle_lut = test_has_handle_lut(kgem); 203303b705cfSriastradh DBG(("%s: has handle-lut? 
%d\n", __FUNCTION__, 203403b705cfSriastradh kgem->has_handle_lut)); 203503b705cfSriastradh 203603b705cfSriastradh kgem->has_semaphores = false; 203703b705cfSriastradh if (kgem->has_blt && test_has_semaphores_enabled(kgem)) 203803b705cfSriastradh kgem->has_semaphores = true; 203903b705cfSriastradh DBG(("%s: semaphores enabled? %d\n", __FUNCTION__, 204003b705cfSriastradh kgem->has_semaphores)); 204103b705cfSriastradh 204203b705cfSriastradh kgem->can_blt_cpu = gen >= 030; 204303b705cfSriastradh DBG(("%s: can blt to cpu? %d\n", __FUNCTION__, 204403b705cfSriastradh kgem->can_blt_cpu)); 204503b705cfSriastradh 204663ef14f0Smrg kgem->can_blt_y = test_can_blt_y(kgem); 204763ef14f0Smrg DBG(("%s: can blit to Y-tiled surfaces? %d\n", __FUNCTION__, 204863ef14f0Smrg kgem->can_blt_y)); 204963ef14f0Smrg 20509a906b70Schristos kgem->can_render_y = gen != 021 && (gen >> 3) != 4; 20519a906b70Schristos DBG(("%s: can render to Y-tiled surfaces? %d\n", __FUNCTION__, 20529a906b70Schristos kgem->can_render_y)); 20539a906b70Schristos 205463ef14f0Smrg kgem->can_scanout_y = test_can_scanout_y(kgem); 205563ef14f0Smrg DBG(("%s: can scanout Y-tiled surfaces? %d\n", __FUNCTION__, 205663ef14f0Smrg kgem->can_scanout_y)); 205763ef14f0Smrg 205863ef14f0Smrg kgem->has_dirtyfb = test_has_dirtyfb(kgem); 205963ef14f0Smrg DBG(("%s: has dirty fb? %d\n", __FUNCTION__, kgem->has_dirtyfb)); 206063ef14f0Smrg 206103b705cfSriastradh kgem->has_secure_batches = test_has_secure_batches(kgem); 206203b705cfSriastradh DBG(("%s: can use privileged batchbuffers? %d\n", __FUNCTION__, 206303b705cfSriastradh kgem->has_secure_batches)); 206403b705cfSriastradh 206503b705cfSriastradh kgem->has_pinned_batches = test_has_pinned_batches(kgem); 206603b705cfSriastradh DBG(("%s: can use pinned batchbuffers (to avoid CS w/a)? 
%d\n", __FUNCTION__, 206703b705cfSriastradh kgem->has_pinned_batches)); 206803b705cfSriastradh 206903b705cfSriastradh if (!is_hw_supported(kgem, dev)) { 207003b705cfSriastradh xf86DrvMsg(kgem_get_screen_index(kgem), X_WARNING, 207103b705cfSriastradh "Detected unsupported/dysfunctional hardware, disabling acceleration.\n"); 2072813957e3Ssnj __kgem_set_wedged(kgem); 20739a906b70Schristos } else if (__kgem_throttle(kgem, false)) { 207403b705cfSriastradh xf86DrvMsg(kgem_get_screen_index(kgem), X_WARNING, 207503b705cfSriastradh "Detected a hung GPU, disabling acceleration.\n"); 2076813957e3Ssnj __kgem_set_wedged(kgem); 207703b705cfSriastradh } 207803b705cfSriastradh 2079813957e3Ssnj kgem->batch_size = UINT16_MAX & ~7; 208003b705cfSriastradh if (gen == 020 && !kgem->has_pinned_batches) 208103b705cfSriastradh /* Limited to what we can pin */ 208203b705cfSriastradh kgem->batch_size = 4*1024; 208303b705cfSriastradh if (gen == 022) 208403b705cfSriastradh /* 865g cannot handle a batch spanning multiple pages */ 208503b705cfSriastradh kgem->batch_size = PAGE_SIZE / sizeof(uint32_t); 20869a906b70Schristos if (gen >= 070) 208703b705cfSriastradh kgem->batch_size = 16*1024; 208803b705cfSriastradh if (!kgem->has_relaxed_delta && kgem->batch_size > 4*1024) 208903b705cfSriastradh kgem->batch_size = 4*1024; 209003b705cfSriastradh 209163ef14f0Smrg if (!kgem_init_pinned_batches(kgem)) { 209203b705cfSriastradh xf86DrvMsg(kgem_get_screen_index(kgem), X_WARNING, 209303b705cfSriastradh "Unable to reserve memory for GPU, disabling acceleration.\n"); 2094813957e3Ssnj __kgem_set_wedged(kgem); 209503b705cfSriastradh } 209603b705cfSriastradh 209703b705cfSriastradh DBG(("%s: maximum batch size? 
%d\n", __FUNCTION__, 209803b705cfSriastradh kgem->batch_size)); 2099813957e3Ssnj kgem_new_batch(kgem); 210003b705cfSriastradh 210103b705cfSriastradh kgem->half_cpu_cache_pages = cpu_cache_size() >> 13; 210203b705cfSriastradh DBG(("%s: last-level cache size: %d bytes, threshold in pages: %d\n", 210303b705cfSriastradh __FUNCTION__, cpu_cache_size(), kgem->half_cpu_cache_pages)); 210403b705cfSriastradh 210503b705cfSriastradh kgem->next_request = __kgem_request_alloc(kgem); 210603b705cfSriastradh 210703b705cfSriastradh DBG(("%s: cpu bo enabled %d: llc? %d, set-cache-level? %d, userptr? %d\n", __FUNCTION__, 210803b705cfSriastradh !DBG_NO_CPU && (kgem->has_llc | kgem->has_userptr | kgem->has_caching), 210903b705cfSriastradh kgem->has_llc, kgem->has_caching, kgem->has_userptr)); 211003b705cfSriastradh 211163ef14f0Smrg gtt_size = get_gtt_size(fd); 211263ef14f0Smrg kgem->aperture_total = gtt_size; 211363ef14f0Smrg kgem->aperture_high = gtt_size * 3/4; 211463ef14f0Smrg kgem->aperture_low = gtt_size * 1/3; 211503b705cfSriastradh if (gen < 033) { 211603b705cfSriastradh /* Severe alignment penalties */ 211703b705cfSriastradh kgem->aperture_high /= 2; 211803b705cfSriastradh kgem->aperture_low /= 2; 211903b705cfSriastradh } 212063ef14f0Smrg DBG(("%s: aperture low=%u [%u], high=%u [%u]\n", __FUNCTION__, 212103b705cfSriastradh kgem->aperture_low, kgem->aperture_low / (1024*1024), 212203b705cfSriastradh kgem->aperture_high, kgem->aperture_high / (1024*1024))); 212303b705cfSriastradh 21249a906b70Schristos kgem->aperture_mappable = 256 * 1024 * 1024; 21259a906b70Schristos if (dev != NULL) 21269a906b70Schristos kgem->aperture_mappable = agp_aperture_size(dev, gen); 212763ef14f0Smrg if (kgem->aperture_mappable == 0 || kgem->aperture_mappable > gtt_size) 212863ef14f0Smrg kgem->aperture_mappable = gtt_size; 212903b705cfSriastradh DBG(("%s: aperture mappable=%d [%d MiB]\n", __FUNCTION__, 213003b705cfSriastradh kgem->aperture_mappable, kgem->aperture_mappable / (1024*1024))); 
213103b705cfSriastradh 21329a906b70Schristos kgem->aperture_fenceable = MIN(256*1024*1024, kgem->aperture_mappable); 21339a906b70Schristos DBG(("%s: aperture fenceable=%d [%d MiB]\n", __FUNCTION__, 21349a906b70Schristos kgem->aperture_fenceable, kgem->aperture_fenceable / (1024*1024))); 21359a906b70Schristos 213603b705cfSriastradh kgem->buffer_size = 64 * 1024; 213703b705cfSriastradh while (kgem->buffer_size < kgem->aperture_mappable >> 10) 213803b705cfSriastradh kgem->buffer_size *= 2; 213903b705cfSriastradh if (kgem->buffer_size >> 12 > kgem->half_cpu_cache_pages) 214003b705cfSriastradh kgem->buffer_size = kgem->half_cpu_cache_pages << 12; 214103b705cfSriastradh kgem->buffer_size = 1 << __fls(kgem->buffer_size); 214203b705cfSriastradh DBG(("%s: buffer size=%d [%d KiB]\n", __FUNCTION__, 214303b705cfSriastradh kgem->buffer_size, kgem->buffer_size / 1024)); 214403b705cfSriastradh assert(kgem->buffer_size); 214503b705cfSriastradh 214603b705cfSriastradh kgem->max_object_size = 3 * (kgem->aperture_high >> 12) << 10; 214703b705cfSriastradh kgem->max_gpu_size = kgem->max_object_size; 214803b705cfSriastradh if (!kgem->has_llc && kgem->max_gpu_size > MAX_CACHE_SIZE) 214903b705cfSriastradh kgem->max_gpu_size = MAX_CACHE_SIZE; 215003b705cfSriastradh 215103b705cfSriastradh totalram = total_ram_size(); 215203b705cfSriastradh if (totalram == 0) { 215303b705cfSriastradh DBG(("%s: total ram size unknown, assuming maximum of total aperture\n", 215403b705cfSriastradh __FUNCTION__)); 215503b705cfSriastradh totalram = kgem->aperture_total; 215603b705cfSriastradh } 215763ef14f0Smrg DBG(("%s: total ram=%lld\n", __FUNCTION__, (long long)totalram)); 215803b705cfSriastradh if (kgem->max_object_size > totalram / 2) 215903b705cfSriastradh kgem->max_object_size = totalram / 2; 216003b705cfSriastradh if (kgem->max_gpu_size > totalram / 4) 216103b705cfSriastradh kgem->max_gpu_size = totalram / 4; 216203b705cfSriastradh 21639a906b70Schristos if (kgem->aperture_high > totalram / 2) { 
21649a906b70Schristos kgem->aperture_high = totalram / 2; 21659a906b70Schristos kgem->aperture_low = kgem->aperture_high / 4; 21669a906b70Schristos DBG(("%s: reduced aperture watermaks to fit into ram; low=%d [%d], high=%d [%d]\n", __FUNCTION__, 21679a906b70Schristos kgem->aperture_low, kgem->aperture_low / (1024*1024), 21689a906b70Schristos kgem->aperture_high, kgem->aperture_high / (1024*1024))); 21699a906b70Schristos } 21709a906b70Schristos 217103b705cfSriastradh kgem->max_cpu_size = kgem->max_object_size; 217203b705cfSriastradh 217303b705cfSriastradh half_gpu_max = kgem->max_gpu_size / 2; 217403b705cfSriastradh kgem->max_copy_tile_size = (MAX_CACHE_SIZE + 1)/2; 217503b705cfSriastradh if (kgem->max_copy_tile_size > half_gpu_max) 217603b705cfSriastradh kgem->max_copy_tile_size = half_gpu_max; 217703b705cfSriastradh 217803b705cfSriastradh if (kgem->has_llc) 217903b705cfSriastradh kgem->max_upload_tile_size = kgem->max_copy_tile_size; 218003b705cfSriastradh else 21819a906b70Schristos kgem->max_upload_tile_size = kgem->aperture_fenceable / 4; 218203b705cfSriastradh if (kgem->max_upload_tile_size > half_gpu_max) 218303b705cfSriastradh kgem->max_upload_tile_size = half_gpu_max; 218403b705cfSriastradh if (kgem->max_upload_tile_size > kgem->aperture_high/2) 218503b705cfSriastradh kgem->max_upload_tile_size = kgem->aperture_high/2; 218603b705cfSriastradh if (kgem->max_upload_tile_size > kgem->aperture_low) 218703b705cfSriastradh kgem->max_upload_tile_size = kgem->aperture_low; 218803b705cfSriastradh if (kgem->max_upload_tile_size < 16*PAGE_SIZE) 218903b705cfSriastradh kgem->max_upload_tile_size = 16*PAGE_SIZE; 219003b705cfSriastradh 219103b705cfSriastradh kgem->large_object_size = MAX_CACHE_SIZE; 219203b705cfSriastradh if (kgem->large_object_size > half_gpu_max) 219303b705cfSriastradh kgem->large_object_size = half_gpu_max; 219403b705cfSriastradh if (kgem->max_copy_tile_size > kgem->aperture_high/2) 219503b705cfSriastradh kgem->max_copy_tile_size = kgem->aperture_high/2; 
219603b705cfSriastradh if (kgem->max_copy_tile_size > kgem->aperture_low) 219703b705cfSriastradh kgem->max_copy_tile_size = kgem->aperture_low; 219803b705cfSriastradh if (kgem->max_copy_tile_size < 16*PAGE_SIZE) 219903b705cfSriastradh kgem->max_copy_tile_size = 16*PAGE_SIZE; 220003b705cfSriastradh 220103b705cfSriastradh if (kgem->has_llc | kgem->has_caching | kgem->has_userptr) { 220203b705cfSriastradh if (kgem->large_object_size > kgem->max_cpu_size) 220303b705cfSriastradh kgem->large_object_size = kgem->max_cpu_size; 220403b705cfSriastradh } else 220503b705cfSriastradh kgem->max_cpu_size = 0; 220603b705cfSriastradh if (DBG_NO_CPU) 220703b705cfSriastradh kgem->max_cpu_size = 0; 220803b705cfSriastradh 220963ef14f0Smrg DBG(("%s: maximum object size=%u\n", 221003b705cfSriastradh __FUNCTION__, kgem->max_object_size)); 221163ef14f0Smrg DBG(("%s: large object thresold=%u\n", 221203b705cfSriastradh __FUNCTION__, kgem->large_object_size)); 221363ef14f0Smrg DBG(("%s: max object sizes (gpu=%u, cpu=%u, tile upload=%u, copy=%u)\n", 221403b705cfSriastradh __FUNCTION__, 221503b705cfSriastradh kgem->max_gpu_size, kgem->max_cpu_size, 221603b705cfSriastradh kgem->max_upload_tile_size, kgem->max_copy_tile_size)); 221703b705cfSriastradh 221803b705cfSriastradh /* Convert the aperture thresholds to pages */ 22199a906b70Schristos kgem->aperture_mappable /= PAGE_SIZE; 22209a906b70Schristos kgem->aperture_fenceable /= PAGE_SIZE; 222103b705cfSriastradh kgem->aperture_low /= PAGE_SIZE; 222203b705cfSriastradh kgem->aperture_high /= PAGE_SIZE; 22239a906b70Schristos kgem->aperture_total /= PAGE_SIZE; 222403b705cfSriastradh 222503b705cfSriastradh kgem->fence_max = gem_param(kgem, I915_PARAM_NUM_FENCES_AVAIL) - 2; 222603b705cfSriastradh if ((int)kgem->fence_max < 0) 222703b705cfSriastradh kgem->fence_max = 5; /* minimum safe value for all hw */ 222803b705cfSriastradh DBG(("%s: max fences=%d\n", __FUNCTION__, kgem->fence_max)); 222903b705cfSriastradh 223003b705cfSriastradh kgem->batch_flags_base 
= 0; 223103b705cfSriastradh if (kgem->has_no_reloc) 223203b705cfSriastradh kgem->batch_flags_base |= LOCAL_I915_EXEC_NO_RELOC; 223303b705cfSriastradh if (kgem->has_handle_lut) 223403b705cfSriastradh kgem->batch_flags_base |= LOCAL_I915_EXEC_HANDLE_LUT; 223503b705cfSriastradh if (kgem->has_pinned_batches) 223603b705cfSriastradh kgem->batch_flags_base |= LOCAL_I915_EXEC_IS_PINNED; 223703b705cfSriastradh 223803b705cfSriastradh kgem_init_swizzling(kgem); 223903b705cfSriastradh} 224003b705cfSriastradh 224103b705cfSriastradh/* XXX hopefully a good approximation */ 22429a906b70Schristosstatic uint32_t kgem_get_unique_id(struct kgem *kgem) 224303b705cfSriastradh{ 224403b705cfSriastradh uint32_t id; 224503b705cfSriastradh id = ++kgem->unique_id; 224603b705cfSriastradh if (id == 0) 224703b705cfSriastradh id = ++kgem->unique_id; 224803b705cfSriastradh return id; 224903b705cfSriastradh} 225003b705cfSriastradh 225103b705cfSriastradhinline static uint32_t kgem_pitch_alignment(struct kgem *kgem, unsigned flags) 225203b705cfSriastradh{ 225303b705cfSriastradh if (flags & CREATE_PRIME) 225403b705cfSriastradh return 256; 225503b705cfSriastradh if (flags & CREATE_SCANOUT) 225603b705cfSriastradh return 64; 2257813957e3Ssnj if (kgem->gen >= 0100) 2258813957e3Ssnj return 32; 22599a906b70Schristos return 8; 226003b705cfSriastradh} 226103b705cfSriastradh 22629a906b70Schristosvoid kgem_get_tile_size(struct kgem *kgem, int tiling, int pitch, 226303b705cfSriastradh int *tile_width, int *tile_height, int *tile_size) 226403b705cfSriastradh{ 226503b705cfSriastradh if (kgem->gen <= 030) { 226603b705cfSriastradh if (tiling) { 226703b705cfSriastradh if (kgem->gen < 030) { 226803b705cfSriastradh *tile_width = 128; 226903b705cfSriastradh *tile_height = 16; 227003b705cfSriastradh *tile_size = 2048; 227103b705cfSriastradh } else { 227203b705cfSriastradh *tile_width = 512; 227303b705cfSriastradh *tile_height = 8; 227403b705cfSriastradh *tile_size = 4096; 227503b705cfSriastradh } 227603b705cfSriastradh } 
else { 227703b705cfSriastradh *tile_width = 1; 227803b705cfSriastradh *tile_height = 1; 227903b705cfSriastradh *tile_size = 1; 228003b705cfSriastradh } 228103b705cfSriastradh } else switch (tiling) { 228203b705cfSriastradh default: 228303b705cfSriastradh case I915_TILING_NONE: 228403b705cfSriastradh *tile_width = 1; 228503b705cfSriastradh *tile_height = 1; 228603b705cfSriastradh *tile_size = 1; 228703b705cfSriastradh break; 228803b705cfSriastradh case I915_TILING_X: 228903b705cfSriastradh *tile_width = 512; 229003b705cfSriastradh *tile_height = 8; 229103b705cfSriastradh *tile_size = 4096; 229203b705cfSriastradh break; 229303b705cfSriastradh case I915_TILING_Y: 229403b705cfSriastradh *tile_width = 128; 229503b705cfSriastradh *tile_height = 32; 229603b705cfSriastradh *tile_size = 4096; 229703b705cfSriastradh break; 229803b705cfSriastradh } 22999a906b70Schristos 23009a906b70Schristos /* Force offset alignment to tile-row */ 23019a906b70Schristos if (tiling && kgem->gen < 033) 23029a906b70Schristos *tile_width = pitch; 230303b705cfSriastradh} 230403b705cfSriastradh 230503b705cfSriastradhstatic uint32_t kgem_surface_size(struct kgem *kgem, 230603b705cfSriastradh bool relaxed_fencing, 230703b705cfSriastradh unsigned flags, 230803b705cfSriastradh uint32_t width, 230903b705cfSriastradh uint32_t height, 231003b705cfSriastradh uint32_t bpp, 231103b705cfSriastradh uint32_t tiling, 231203b705cfSriastradh uint32_t *pitch) 231303b705cfSriastradh{ 231403b705cfSriastradh uint32_t tile_width, tile_height; 231503b705cfSriastradh uint32_t size; 231603b705cfSriastradh 231703b705cfSriastradh assert(width <= MAXSHORT); 231803b705cfSriastradh assert(height <= MAXSHORT); 231903b705cfSriastradh assert(bpp >= 8); 232003b705cfSriastradh 232103b705cfSriastradh if (kgem->gen <= 030) { 232203b705cfSriastradh if (tiling) { 232303b705cfSriastradh if (kgem->gen < 030) { 232403b705cfSriastradh tile_width = 128; 23259a906b70Schristos tile_height = 16; 232603b705cfSriastradh } else { 
232703b705cfSriastradh tile_width = 512; 23289a906b70Schristos tile_height = 8; 232903b705cfSriastradh } 233003b705cfSriastradh } else { 233103b705cfSriastradh tile_width = 2 * bpp >> 3; 233203b705cfSriastradh tile_width = ALIGN(tile_width, 233303b705cfSriastradh kgem_pitch_alignment(kgem, flags)); 23349a906b70Schristos tile_height = 1; 233503b705cfSriastradh } 233603b705cfSriastradh } else switch (tiling) { 233703b705cfSriastradh default: 233803b705cfSriastradh case I915_TILING_NONE: 233903b705cfSriastradh tile_width = 2 * bpp >> 3; 234003b705cfSriastradh tile_width = ALIGN(tile_width, 234103b705cfSriastradh kgem_pitch_alignment(kgem, flags)); 23429a906b70Schristos tile_height = 1; 234303b705cfSriastradh break; 234403b705cfSriastradh 234503b705cfSriastradh case I915_TILING_X: 234603b705cfSriastradh tile_width = 512; 23479a906b70Schristos tile_height = 8; 234803b705cfSriastradh break; 234903b705cfSriastradh case I915_TILING_Y: 235003b705cfSriastradh tile_width = 128; 23519a906b70Schristos tile_height = 32; 235203b705cfSriastradh break; 235303b705cfSriastradh } 23549a906b70Schristos /* XXX align to an even tile row */ 23559a906b70Schristos if (!kgem->has_relaxed_fencing) 23569a906b70Schristos tile_height *= 2; 235703b705cfSriastradh 235803b705cfSriastradh *pitch = ALIGN(width * bpp / 8, tile_width); 235903b705cfSriastradh height = ALIGN(height, tile_height); 23609a906b70Schristos DBG(("%s: tile_width=%d, tile_height=%d => aligned pitch=%d, height=%d\n", 23619a906b70Schristos __FUNCTION__, tile_width, tile_height, *pitch, height)); 23629a906b70Schristos 236303b705cfSriastradh if (kgem->gen >= 040) 236403b705cfSriastradh return PAGE_ALIGN(*pitch * height); 236503b705cfSriastradh 236603b705cfSriastradh /* If it is too wide for the blitter, don't even bother. 
*/ 236703b705cfSriastradh if (tiling != I915_TILING_NONE) { 23689a906b70Schristos if (*pitch > 8192) { 23699a906b70Schristos DBG(("%s: too wide for tiled surface (pitch=%d, limit=%d)\n", 23709a906b70Schristos __FUNCTION__, *pitch, 8192)); 237103b705cfSriastradh return 0; 23729a906b70Schristos } 237303b705cfSriastradh 237403b705cfSriastradh for (size = tile_width; size < *pitch; size <<= 1) 237503b705cfSriastradh ; 237603b705cfSriastradh *pitch = size; 237703b705cfSriastradh } else { 23789a906b70Schristos if (*pitch >= 32768) { 23799a906b70Schristos DBG(("%s: too wide for linear surface (pitch=%d, limit=%d)\n", 23809a906b70Schristos __FUNCTION__, *pitch, 32767)); 238103b705cfSriastradh return 0; 23829a906b70Schristos } 238303b705cfSriastradh } 238403b705cfSriastradh 238503b705cfSriastradh size = *pitch * height; 238603b705cfSriastradh if (relaxed_fencing || tiling == I915_TILING_NONE) 238703b705cfSriastradh return PAGE_ALIGN(size); 238803b705cfSriastradh 23899a906b70Schristos /* We need to allocate a pot fence region for a tiled buffer. 
*/ 239003b705cfSriastradh if (kgem->gen < 030) 239103b705cfSriastradh tile_width = 512 * 1024; 239203b705cfSriastradh else 239303b705cfSriastradh tile_width = 1024 * 1024; 239403b705cfSriastradh while (tile_width < size) 239503b705cfSriastradh tile_width *= 2; 239603b705cfSriastradh return tile_width; 239703b705cfSriastradh} 239803b705cfSriastradh 23999a906b70Schristosbool kgem_check_surface_size(struct kgem *kgem, 24009a906b70Schristos uint32_t width, 24019a906b70Schristos uint32_t height, 24029a906b70Schristos uint32_t bpp, 24039a906b70Schristos uint32_t tiling, 24049a906b70Schristos uint32_t pitch, 24059a906b70Schristos uint32_t size) 24069a906b70Schristos{ 24079a906b70Schristos uint32_t min_size, min_pitch; 24089a906b70Schristos int tile_width, tile_height, tile_size; 24099a906b70Schristos 24109a906b70Schristos DBG(("%s(width=%d, height=%d, bpp=%d, tiling=%d, pitch=%d, size=%d)\n", 24119a906b70Schristos __FUNCTION__, width, height, bpp, tiling, pitch, size)); 24129a906b70Schristos 24139a906b70Schristos if (pitch & 3) 24149a906b70Schristos return false; 24159a906b70Schristos 24169a906b70Schristos min_size = kgem_surface_size(kgem, kgem->has_relaxed_fencing, 0, 24179a906b70Schristos width, height, bpp, tiling, 24189a906b70Schristos &min_pitch); 24199a906b70Schristos 24209a906b70Schristos DBG(("%s: min_pitch=%d, min_size=%d\n", __FUNCTION__, min_pitch, min_size)); 24219a906b70Schristos 24229a906b70Schristos if (size < min_size) 24239a906b70Schristos return false; 24249a906b70Schristos 24259a906b70Schristos if (pitch < min_pitch) 24269a906b70Schristos return false; 24279a906b70Schristos 24289a906b70Schristos kgem_get_tile_size(kgem, tiling, min_pitch, 24299a906b70Schristos &tile_width, &tile_height, &tile_size); 24309a906b70Schristos 24319a906b70Schristos DBG(("%s: tile_width=%d, tile_size=%d\n", __FUNCTION__, tile_width, tile_size)); 24329a906b70Schristos if (pitch & (tile_width - 1)) 24339a906b70Schristos return false; 24349a906b70Schristos if (size & (tile_size 
- 1)) 24359a906b70Schristos return false; 24369a906b70Schristos 24379a906b70Schristos return true; 24389a906b70Schristos} 24399a906b70Schristos 244003b705cfSriastradhstatic uint32_t kgem_aligned_height(struct kgem *kgem, 244103b705cfSriastradh uint32_t height, uint32_t tiling) 244203b705cfSriastradh{ 244303b705cfSriastradh uint32_t tile_height; 244403b705cfSriastradh 244503b705cfSriastradh if (kgem->gen <= 030) { 24469a906b70Schristos tile_height = tiling ? kgem->gen < 030 ? 16 : 8 : 1; 244703b705cfSriastradh } else switch (tiling) { 244803b705cfSriastradh /* XXX align to an even tile row */ 244903b705cfSriastradh default: 245003b705cfSriastradh case I915_TILING_NONE: 245103b705cfSriastradh tile_height = 1; 245203b705cfSriastradh break; 245303b705cfSriastradh case I915_TILING_X: 24549a906b70Schristos tile_height = 8; 245503b705cfSriastradh break; 245603b705cfSriastradh case I915_TILING_Y: 24579a906b70Schristos tile_height = 32; 245803b705cfSriastradh break; 245903b705cfSriastradh } 246003b705cfSriastradh 24619a906b70Schristos /* XXX align to an even tile row */ 24629a906b70Schristos if (!kgem->has_relaxed_fencing) 24639a906b70Schristos tile_height *= 2; 24649a906b70Schristos 246503b705cfSriastradh return ALIGN(height, tile_height); 246603b705cfSriastradh} 246703b705cfSriastradh 246803b705cfSriastradhstatic struct drm_i915_gem_exec_object2 * 246903b705cfSriastradhkgem_add_handle(struct kgem *kgem, struct kgem_bo *bo) 247003b705cfSriastradh{ 247103b705cfSriastradh struct drm_i915_gem_exec_object2 *exec; 247203b705cfSriastradh 247303b705cfSriastradh DBG(("%s: handle=%d, index=%d\n", 247403b705cfSriastradh __FUNCTION__, bo->handle, kgem->nexec)); 247503b705cfSriastradh 247603b705cfSriastradh assert(kgem->nexec < ARRAY_SIZE(kgem->exec)); 247703b705cfSriastradh bo->target_handle = kgem->has_handle_lut ? 
kgem->nexec : bo->handle; 247803b705cfSriastradh exec = memset(&kgem->exec[kgem->nexec++], 0, sizeof(*exec)); 247903b705cfSriastradh exec->handle = bo->handle; 248003b705cfSriastradh exec->offset = bo->presumed_offset; 248103b705cfSriastradh 248203b705cfSriastradh kgem->aperture += num_pages(bo); 248303b705cfSriastradh 248403b705cfSriastradh return exec; 248503b705cfSriastradh} 248603b705cfSriastradh 248703b705cfSriastradhstatic void kgem_add_bo(struct kgem *kgem, struct kgem_bo *bo) 248803b705cfSriastradh{ 24899a906b70Schristos assert(bo->refcnt); 24909a906b70Schristos assert(bo->proxy == NULL); 24919a906b70Schristos 249203b705cfSriastradh bo->exec = kgem_add_handle(kgem, bo); 249303b705cfSriastradh bo->rq = MAKE_REQUEST(kgem->next_request, kgem->ring); 249403b705cfSriastradh 249503b705cfSriastradh list_move_tail(&bo->request, &kgem->next_request->buffers); 24969a906b70Schristos if (bo->io && !list_is_empty(&bo->list)) 24979a906b70Schristos list_move(&bo->list, &kgem->batch_buffers); 249803b705cfSriastradh 249903b705cfSriastradh /* XXX is it worth working around gcc here? 
*/ 250003b705cfSriastradh kgem->flush |= bo->flush; 250103b705cfSriastradh} 250203b705cfSriastradh 250363ef14f0Smrgstatic void kgem_clear_swctrl(struct kgem *kgem) 250463ef14f0Smrg{ 250563ef14f0Smrg uint32_t *b; 250663ef14f0Smrg 250763ef14f0Smrg if (kgem->bcs_state == 0) 250863ef14f0Smrg return; 250963ef14f0Smrg 251063ef14f0Smrg DBG(("%s: clearin SWCTRL LRI from %x\n", 251163ef14f0Smrg __FUNCTION__, kgem->bcs_state)); 251263ef14f0Smrg 251363ef14f0Smrg b = kgem->batch + kgem->nbatch; 251463ef14f0Smrg kgem->nbatch += 7; 251563ef14f0Smrg 251663ef14f0Smrg *b++ = MI_FLUSH_DW; 251763ef14f0Smrg *b++ = 0; 251863ef14f0Smrg *b++ = 0; 251963ef14f0Smrg *b++ = 0; 252063ef14f0Smrg 252163ef14f0Smrg *b++ = MI_LOAD_REGISTER_IMM; 252263ef14f0Smrg *b++ = BCS_SWCTRL; 252363ef14f0Smrg *b++ = (BCS_SRC_Y | BCS_DST_Y) << 16; 252463ef14f0Smrg 252563ef14f0Smrg kgem->bcs_state = 0; 252663ef14f0Smrg} 252763ef14f0Smrg 252803b705cfSriastradhstatic uint32_t kgem_end_batch(struct kgem *kgem) 252903b705cfSriastradh{ 253063ef14f0Smrg kgem_clear_swctrl(kgem); 253103b705cfSriastradh kgem->batch[kgem->nbatch++] = MI_BATCH_BUFFER_END; 253203b705cfSriastradh if (kgem->nbatch & 1) 253303b705cfSriastradh kgem->batch[kgem->nbatch++] = MI_NOOP; 253403b705cfSriastradh 253503b705cfSriastradh return kgem->nbatch; 253603b705cfSriastradh} 253703b705cfSriastradh 253803b705cfSriastradhstatic void kgem_bo_binding_free(struct kgem *kgem, struct kgem_bo *bo) 253903b705cfSriastradh{ 254003b705cfSriastradh struct kgem_bo_binding *b; 254103b705cfSriastradh 254203b705cfSriastradh b = bo->binding.next; 254303b705cfSriastradh while (b) { 254403b705cfSriastradh struct kgem_bo_binding *next = b->next; 25459a906b70Schristos free(b); 254603b705cfSriastradh b = next; 254703b705cfSriastradh } 254803b705cfSriastradh} 254903b705cfSriastradh 255003b705cfSriastradhstatic void kgem_bo_free(struct kgem *kgem, struct kgem_bo *bo) 255103b705cfSriastradh{ 25529a906b70Schristos DBG(("%s: handle=%d, size=%d\n", __FUNCTION__, bo->handle, 
bytes(bo))); 255303b705cfSriastradh assert(bo->refcnt == 0); 255403b705cfSriastradh assert(bo->proxy == NULL); 255503b705cfSriastradh assert(bo->exec == NULL); 255603b705cfSriastradh assert(!bo->snoop || bo->rq == NULL); 255703b705cfSriastradh 255803b705cfSriastradh#ifdef DEBUG_MEMORY 255903b705cfSriastradh kgem->debug_memory.bo_allocs--; 256003b705cfSriastradh kgem->debug_memory.bo_bytes -= bytes(bo); 256103b705cfSriastradh#endif 256203b705cfSriastradh 256303b705cfSriastradh kgem_bo_binding_free(kgem, bo); 25649a906b70Schristos kgem_bo_rmfb(kgem, bo); 256503b705cfSriastradh 25669a906b70Schristos if (IS_USER_MAP(bo->map__cpu)) { 256703b705cfSriastradh assert(bo->rq == NULL); 256803b705cfSriastradh assert(!__kgem_busy(kgem, bo->handle)); 25699a906b70Schristos assert(MAP(bo->map__cpu) != bo || bo->io || bo->flush); 257003b705cfSriastradh if (!(bo->io || bo->flush)) { 257103b705cfSriastradh DBG(("%s: freeing snooped base\n", __FUNCTION__)); 25729a906b70Schristos assert(bo != MAP(bo->map__cpu)); 25739a906b70Schristos free(MAP(bo->map__cpu)); 257403b705cfSriastradh } 25759a906b70Schristos bo->map__cpu = NULL; 25769a906b70Schristos } 25779a906b70Schristos 25789a906b70Schristos DBG(("%s: releasing %p:%p vma for handle=%d, count=%d\n", 25799a906b70Schristos __FUNCTION__, bo->map__gtt, bo->map__cpu, 2580813957e3Ssnj bo->handle, list_is_empty(&bo->vma) ? 
0 : kgem->vma[bo->map__gtt == NULL && bo->map__wc == NULL].count)); 25819a906b70Schristos 25829a906b70Schristos if (!list_is_empty(&bo->vma)) { 25839a906b70Schristos _list_del(&bo->vma); 2584813957e3Ssnj kgem->vma[bo->map__gtt == NULL && bo->map__wc == NULL].count--; 258503b705cfSriastradh } 25869a906b70Schristos 25879a906b70Schristos if (bo->map__gtt) 2588813957e3Ssnj munmap(bo->map__gtt, bytes(bo)); 2589813957e3Ssnj if (bo->map__wc) { 2590813957e3Ssnj VG(VALGRIND_MAKE_MEM_NOACCESS(bo->map__wc, bytes(bo))); 2591813957e3Ssnj munmap(bo->map__wc, bytes(bo)); 2592813957e3Ssnj } 2593813957e3Ssnj if (bo->map__cpu) { 2594813957e3Ssnj VG(VALGRIND_MAKE_MEM_NOACCESS(MAP(bo->map__cpu), bytes(bo))); 25959a906b70Schristos munmap(MAP(bo->map__cpu), bytes(bo)); 2596813957e3Ssnj } 259703b705cfSriastradh 259803b705cfSriastradh _list_del(&bo->list); 259903b705cfSriastradh _list_del(&bo->request); 260003b705cfSriastradh gem_close(kgem->fd, bo->handle); 260103b705cfSriastradh 26029a906b70Schristos if (!bo->io && !DBG_NO_MALLOC_CACHE) { 260303b705cfSriastradh *(struct kgem_bo **)bo = __kgem_freed_bo; 260403b705cfSriastradh __kgem_freed_bo = bo; 260503b705cfSriastradh } else 260603b705cfSriastradh free(bo); 260703b705cfSriastradh} 260803b705cfSriastradh 260903b705cfSriastradhinline static void kgem_bo_move_to_inactive(struct kgem *kgem, 261003b705cfSriastradh struct kgem_bo *bo) 261103b705cfSriastradh{ 261203b705cfSriastradh DBG(("%s: moving handle=%d to inactive\n", __FUNCTION__, bo->handle)); 261303b705cfSriastradh 261403b705cfSriastradh assert(bo->refcnt == 0); 261503b705cfSriastradh assert(bo->reusable); 261603b705cfSriastradh assert(bo->rq == NULL); 261703b705cfSriastradh assert(bo->exec == NULL); 261803b705cfSriastradh assert(bo->domain != DOMAIN_GPU); 261903b705cfSriastradh assert(!bo->proxy); 262003b705cfSriastradh assert(!bo->io); 262103b705cfSriastradh assert(!bo->scanout); 262203b705cfSriastradh assert(!bo->snoop); 262303b705cfSriastradh assert(!bo->flush); 
262403b705cfSriastradh assert(!bo->needs_flush); 262563ef14f0Smrg assert(!bo->delta); 262603b705cfSriastradh assert(list_is_empty(&bo->vma)); 262703b705cfSriastradh assert_tiling(kgem, bo); 262863ef14f0Smrg assert_caching(kgem, bo); 262903b705cfSriastradh ASSERT_IDLE(kgem, bo->handle); 263003b705cfSriastradh 263103b705cfSriastradh if (bucket(bo) >= NUM_CACHE_BUCKETS) { 26329a906b70Schristos if (bo->map__gtt) { 263363ef14f0Smrg DBG(("%s: relinquishing large GTT mapping for handle=%d\n", 263463ef14f0Smrg __FUNCTION__, bo->handle)); 2635813957e3Ssnj munmap(bo->map__gtt, bytes(bo)); 26369a906b70Schristos bo->map__gtt = NULL; 26379a906b70Schristos } 263803b705cfSriastradh 26399a906b70Schristos list_move(&bo->list, &kgem->large_inactive); 26409a906b70Schristos } else { 26419a906b70Schristos assert(bo->flush == false); 2642813957e3Ssnj assert(list_is_empty(&bo->vma)); 26439a906b70Schristos list_move(&bo->list, &kgem->inactive[bucket(bo)]); 2644813957e3Ssnj if (bo->map__gtt && !kgem_bo_can_map(kgem, bo)) { 264563ef14f0Smrg DBG(("%s: relinquishing old GTT mapping for handle=%d\n", 264663ef14f0Smrg __FUNCTION__, bo->handle)); 2647813957e3Ssnj munmap(bo->map__gtt, bytes(bo)); 2648813957e3Ssnj bo->map__gtt = NULL; 264903b705cfSriastradh } 2650813957e3Ssnj if (bo->map__gtt || (bo->map__wc && !bo->tiling)) { 2651813957e3Ssnj list_add(&bo->vma, &kgem->vma[0].inactive[bucket(bo)]); 2652813957e3Ssnj kgem->vma[0].count++; 2653813957e3Ssnj } 2654813957e3Ssnj if (bo->map__cpu && list_is_empty(&bo->vma)) { 26559a906b70Schristos list_add(&bo->vma, &kgem->vma[1].inactive[bucket(bo)]); 26569a906b70Schristos kgem->vma[1].count++; 265703b705cfSriastradh } 265803b705cfSriastradh } 26599a906b70Schristos 26609a906b70Schristos kgem->need_expire = true; 266103b705cfSriastradh} 266203b705cfSriastradh 266303b705cfSriastradhstatic struct kgem_bo *kgem_bo_replace_io(struct kgem_bo *bo) 266403b705cfSriastradh{ 266503b705cfSriastradh struct kgem_bo *base; 266603b705cfSriastradh 266703b705cfSriastradh 
if (!bo->io) 266803b705cfSriastradh return bo; 266903b705cfSriastradh 267003b705cfSriastradh assert(!bo->snoop); 267163ef14f0Smrg assert(!bo->purged); 267263ef14f0Smrg assert(!bo->scanout); 267363ef14f0Smrg assert(!bo->delta); 267463ef14f0Smrg 26759a906b70Schristos if (__kgem_freed_bo) { 26769a906b70Schristos base = __kgem_freed_bo; 26779a906b70Schristos __kgem_freed_bo = *(struct kgem_bo **)base; 26789a906b70Schristos } else 26799a906b70Schristos base = malloc(sizeof(*base)); 268003b705cfSriastradh if (base) { 268103b705cfSriastradh DBG(("%s: transferring io handle=%d to bo\n", 268203b705cfSriastradh __FUNCTION__, bo->handle)); 268303b705cfSriastradh /* transfer the handle to a minimum bo */ 268403b705cfSriastradh memcpy(base, bo, sizeof(*base)); 268503b705cfSriastradh base->io = false; 268603b705cfSriastradh list_init(&base->list); 268703b705cfSriastradh list_replace(&bo->request, &base->request); 268803b705cfSriastradh list_replace(&bo->vma, &base->vma); 268903b705cfSriastradh free(bo); 269003b705cfSriastradh bo = base; 269103b705cfSriastradh } else 269203b705cfSriastradh bo->reusable = false; 269303b705cfSriastradh 269403b705cfSriastradh return bo; 269503b705cfSriastradh} 269603b705cfSriastradh 269703b705cfSriastradhinline static void kgem_bo_remove_from_inactive(struct kgem *kgem, 269803b705cfSriastradh struct kgem_bo *bo) 269903b705cfSriastradh{ 270003b705cfSriastradh DBG(("%s: removing handle=%d from inactive\n", __FUNCTION__, bo->handle)); 270103b705cfSriastradh 270203b705cfSriastradh list_del(&bo->list); 270303b705cfSriastradh assert(bo->rq == NULL); 270403b705cfSriastradh assert(bo->exec == NULL); 270563ef14f0Smrg assert(!bo->purged); 27069a906b70Schristos if (!list_is_empty(&bo->vma)) { 2707813957e3Ssnj assert(bo->map__gtt || bo->map__wc || bo->map__cpu); 270803b705cfSriastradh list_del(&bo->vma); 2709813957e3Ssnj kgem->vma[bo->map__gtt == NULL && bo->map__wc == NULL].count--; 271003b705cfSriastradh } 271103b705cfSriastradh} 271203b705cfSriastradh 
271303b705cfSriastradhinline static void kgem_bo_remove_from_active(struct kgem *kgem, 271403b705cfSriastradh struct kgem_bo *bo) 271503b705cfSriastradh{ 271603b705cfSriastradh DBG(("%s: removing handle=%d from active\n", __FUNCTION__, bo->handle)); 271703b705cfSriastradh 271803b705cfSriastradh list_del(&bo->list); 271903b705cfSriastradh assert(bo->rq != NULL); 27209a906b70Schristos if (RQ(bo->rq) == (void *)kgem) { 27219a906b70Schristos assert(bo->exec == NULL); 272203b705cfSriastradh list_del(&bo->request); 27239a906b70Schristos } 272403b705cfSriastradh assert(list_is_empty(&bo->vma)); 272503b705cfSriastradh} 272603b705cfSriastradh 272703b705cfSriastradhstatic void _kgem_bo_delete_buffer(struct kgem *kgem, struct kgem_bo *bo) 272803b705cfSriastradh{ 272903b705cfSriastradh struct kgem_buffer *io = (struct kgem_buffer *)bo->proxy; 273003b705cfSriastradh 273103b705cfSriastradh DBG(("%s: size=%d, offset=%d, parent used=%d\n", 273203b705cfSriastradh __FUNCTION__, bo->size.bytes, bo->delta, io->used)); 273303b705cfSriastradh 273403b705cfSriastradh if (ALIGN(bo->delta + bo->size.bytes, UPLOAD_ALIGNMENT) == io->used) 273503b705cfSriastradh io->used = bo->delta; 273603b705cfSriastradh} 273703b705cfSriastradh 273803b705cfSriastradhstatic bool check_scanout_size(struct kgem *kgem, 273903b705cfSriastradh struct kgem_bo *bo, 274003b705cfSriastradh int width, int height) 274103b705cfSriastradh{ 274203b705cfSriastradh struct drm_mode_fb_cmd info; 274303b705cfSriastradh 274403b705cfSriastradh assert(bo->scanout); 274503b705cfSriastradh 274603b705cfSriastradh VG_CLEAR(info); 274703b705cfSriastradh info.fb_id = bo->delta; 274803b705cfSriastradh 27499a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_MODE_GETFB, &info)) 275003b705cfSriastradh return false; 275103b705cfSriastradh 275203b705cfSriastradh gem_close(kgem->fd, info.handle); 275303b705cfSriastradh 275463ef14f0Smrg if (width > info.width || height > info.height) { 275503b705cfSriastradh DBG(("%s: not using scanout %d 
(%dx%d), want (%dx%d)\n", 275603b705cfSriastradh __FUNCTION__, 275703b705cfSriastradh info.fb_id, info.width, info.height, 275803b705cfSriastradh width, height)); 275903b705cfSriastradh return false; 276003b705cfSriastradh } 276103b705cfSriastradh 276203b705cfSriastradh return true; 276303b705cfSriastradh} 276403b705cfSriastradh 276503b705cfSriastradhstatic void kgem_bo_move_to_scanout(struct kgem *kgem, struct kgem_bo *bo) 276603b705cfSriastradh{ 276703b705cfSriastradh assert(bo->refcnt == 0); 276803b705cfSriastradh assert(bo->scanout); 276903b705cfSriastradh assert(!bo->flush); 277003b705cfSriastradh assert(!bo->snoop); 277103b705cfSriastradh assert(!bo->io); 277203b705cfSriastradh 27739a906b70Schristos if (bo->purged) { /* for stolen fb */ 27749a906b70Schristos if (!bo->exec) { 27759a906b70Schristos DBG(("%s: discarding purged scanout - stolen?\n", 27769a906b70Schristos __FUNCTION__)); 27779a906b70Schristos kgem_bo_free(kgem, bo); 27789a906b70Schristos } 277903b705cfSriastradh return; 278003b705cfSriastradh } 278103b705cfSriastradh 278203b705cfSriastradh DBG(("%s: moving %d [fb %d] to scanout cache, active? 
%d\n", 278303b705cfSriastradh __FUNCTION__, bo->handle, bo->delta, bo->rq != NULL)); 278403b705cfSriastradh if (bo->rq) 278503b705cfSriastradh list_move_tail(&bo->list, &kgem->scanout); 278603b705cfSriastradh else 278703b705cfSriastradh list_move(&bo->list, &kgem->scanout); 27889a906b70Schristos 27899a906b70Schristos kgem->need_expire = true; 279003b705cfSriastradh} 279103b705cfSriastradh 279203b705cfSriastradhstatic void kgem_bo_move_to_snoop(struct kgem *kgem, struct kgem_bo *bo) 279303b705cfSriastradh{ 279403b705cfSriastradh assert(bo->reusable); 27959a906b70Schristos assert(!bo->scanout); 279603b705cfSriastradh assert(!bo->flush); 279703b705cfSriastradh assert(!bo->needs_flush); 279803b705cfSriastradh assert(bo->refcnt == 0); 279903b705cfSriastradh assert(bo->exec == NULL); 280063ef14f0Smrg assert(!bo->purged); 280163ef14f0Smrg assert(!bo->delta); 280203b705cfSriastradh 28039a906b70Schristos if (DBG_NO_SNOOP_CACHE) { 28049a906b70Schristos kgem_bo_free(kgem, bo); 28059a906b70Schristos return; 28069a906b70Schristos } 28079a906b70Schristos 280803b705cfSriastradh if (num_pages(bo) > kgem->max_cpu_size >> 13) { 280903b705cfSriastradh DBG(("%s handle=%d discarding large CPU buffer (%d >%d pages)\n", 281003b705cfSriastradh __FUNCTION__, bo->handle, num_pages(bo), kgem->max_cpu_size >> 13)); 281103b705cfSriastradh kgem_bo_free(kgem, bo); 281203b705cfSriastradh return; 281303b705cfSriastradh } 281403b705cfSriastradh 281503b705cfSriastradh assert(bo->tiling == I915_TILING_NONE); 281603b705cfSriastradh assert(bo->rq == NULL); 281703b705cfSriastradh 281803b705cfSriastradh DBG(("%s: moving %d to snoop cachee\n", __FUNCTION__, bo->handle)); 281903b705cfSriastradh list_add(&bo->list, &kgem->snoop); 28209a906b70Schristos kgem->need_expire = true; 28219a906b70Schristos} 28229a906b70Schristos 28239a906b70Schristosstatic bool kgem_bo_move_to_cache(struct kgem *kgem, struct kgem_bo *bo) 28249a906b70Schristos{ 28259a906b70Schristos bool retired = false; 28269a906b70Schristos 
28279a906b70Schristos DBG(("%s: release handle=%d\n", __FUNCTION__, bo->handle)); 28289a906b70Schristos 28299a906b70Schristos if (bo->prime) { 28309a906b70Schristos DBG(("%s: discarding imported prime handle=%d\n", 28319a906b70Schristos __FUNCTION__, bo->handle)); 28329a906b70Schristos kgem_bo_free(kgem, bo); 28339a906b70Schristos } else if (bo->snoop) { 28349a906b70Schristos kgem_bo_move_to_snoop(kgem, bo); 28359a906b70Schristos } else if (bo->scanout) { 28369a906b70Schristos kgem_bo_move_to_scanout(kgem, bo); 283763ef14f0Smrg } else if ((bo = kgem_bo_replace_io(bo))->reusable) { 28389a906b70Schristos kgem_bo_move_to_inactive(kgem, bo); 28399a906b70Schristos retired = true; 28409a906b70Schristos } else 28419a906b70Schristos kgem_bo_free(kgem, bo); 28429a906b70Schristos 28439a906b70Schristos return retired; 284403b705cfSriastradh} 284503b705cfSriastradh 284603b705cfSriastradhstatic struct kgem_bo * 284703b705cfSriastradhsearch_snoop_cache(struct kgem *kgem, unsigned int num_pages, unsigned flags) 284803b705cfSriastradh{ 284903b705cfSriastradh struct kgem_bo *bo, *first = NULL; 285003b705cfSriastradh 285103b705cfSriastradh DBG(("%s: num_pages=%d, flags=%x\n", __FUNCTION__, num_pages, flags)); 285203b705cfSriastradh 285303b705cfSriastradh if ((kgem->has_caching | kgem->has_userptr) == 0) 285403b705cfSriastradh return NULL; 285503b705cfSriastradh 285603b705cfSriastradh if (list_is_empty(&kgem->snoop)) { 285703b705cfSriastradh DBG(("%s: inactive and cache empty\n", __FUNCTION__)); 285803b705cfSriastradh if (!__kgem_throttle_retire(kgem, flags)) { 285903b705cfSriastradh DBG(("%s: nothing retired\n", __FUNCTION__)); 286003b705cfSriastradh return NULL; 286103b705cfSriastradh } 286203b705cfSriastradh } 286303b705cfSriastradh 286403b705cfSriastradh list_for_each_entry(bo, &kgem->snoop, list) { 286503b705cfSriastradh assert(bo->refcnt == 0); 286603b705cfSriastradh assert(bo->snoop); 286703b705cfSriastradh assert(!bo->scanout); 286803b705cfSriastradh assert(!bo->purged); 
286903b705cfSriastradh assert(bo->proxy == NULL); 287003b705cfSriastradh assert(bo->tiling == I915_TILING_NONE); 287103b705cfSriastradh assert(bo->rq == NULL); 287203b705cfSriastradh assert(bo->exec == NULL); 287303b705cfSriastradh 287403b705cfSriastradh if (num_pages > num_pages(bo)) 287503b705cfSriastradh continue; 287603b705cfSriastradh 287703b705cfSriastradh if (num_pages(bo) > 2*num_pages) { 287803b705cfSriastradh if (first == NULL) 287903b705cfSriastradh first = bo; 288003b705cfSriastradh continue; 288103b705cfSriastradh } 288203b705cfSriastradh 288303b705cfSriastradh list_del(&bo->list); 288403b705cfSriastradh bo->pitch = 0; 288503b705cfSriastradh bo->delta = 0; 288603b705cfSriastradh 288703b705cfSriastradh DBG((" %s: found handle=%d (num_pages=%d) in snoop cache\n", 288803b705cfSriastradh __FUNCTION__, bo->handle, num_pages(bo))); 288903b705cfSriastradh return bo; 289003b705cfSriastradh } 289103b705cfSriastradh 289203b705cfSriastradh if (first) { 289303b705cfSriastradh list_del(&first->list); 289403b705cfSriastradh first->pitch = 0; 289503b705cfSriastradh first->delta = 0; 289603b705cfSriastradh 289703b705cfSriastradh DBG((" %s: found handle=%d (num_pages=%d) in snoop cache\n", 289803b705cfSriastradh __FUNCTION__, first->handle, num_pages(first))); 289903b705cfSriastradh return first; 290003b705cfSriastradh } 290103b705cfSriastradh 290203b705cfSriastradh return NULL; 290303b705cfSriastradh} 290403b705cfSriastradh 290503b705cfSriastradhvoid kgem_bo_undo(struct kgem *kgem, struct kgem_bo *bo) 290603b705cfSriastradh{ 290703b705cfSriastradh if (kgem->nexec != 1 || bo->exec == NULL) 290803b705cfSriastradh return; 290903b705cfSriastradh 29109a906b70Schristos assert(bo); 291103b705cfSriastradh DBG(("%s: only handle in batch, discarding last operations for handle=%d\n", 291203b705cfSriastradh __FUNCTION__, bo->handle)); 291303b705cfSriastradh 291463ef14f0Smrg assert(bo->exec == &_kgem_dummy_exec || bo->exec == &kgem->exec[0]); 291503b705cfSriastradh 
assert(kgem->exec[0].handle == bo->handle); 291603b705cfSriastradh assert(RQ(bo->rq) == kgem->next_request); 291703b705cfSriastradh 291803b705cfSriastradh bo->refcnt++; 291903b705cfSriastradh kgem_reset(kgem); 292003b705cfSriastradh bo->refcnt--; 29219a906b70Schristos 29229a906b70Schristos assert(kgem->nreloc == 0); 29239a906b70Schristos assert(kgem->nexec == 0); 29249a906b70Schristos assert(bo->exec == NULL); 292503b705cfSriastradh} 292603b705cfSriastradh 29279a906b70Schristosvoid kgem_bo_pair_undo(struct kgem *kgem, struct kgem_bo *a, struct kgem_bo *b) 292803b705cfSriastradh{ 29299a906b70Schristos if (kgem->nexec > 2) 29309a906b70Schristos return; 293103b705cfSriastradh 29329a906b70Schristos if (kgem->nexec == 1) { 29339a906b70Schristos if (a) 29349a906b70Schristos kgem_bo_undo(kgem, a); 29359a906b70Schristos if (b) 29369a906b70Schristos kgem_bo_undo(kgem, b); 29379a906b70Schristos return; 29389a906b70Schristos } 29399a906b70Schristos 29409a906b70Schristos if (a == NULL || b == NULL) 29419a906b70Schristos return; 294263ef14f0Smrg assert(a != b); 29439a906b70Schristos if (a->exec == NULL || b->exec == NULL) 29449a906b70Schristos return; 29459a906b70Schristos 294663ef14f0Smrg DBG(("%s: only handles in batch, discarding last operations for handle=%d (index=%d) and handle=%d (index=%d)\n", 294763ef14f0Smrg __FUNCTION__, 294863ef14f0Smrg a->handle, a->proxy ? -1 : a->exec - kgem->exec, 294963ef14f0Smrg b->handle, b->proxy ? 
-1 : b->exec - kgem->exec)); 29509a906b70Schristos 295163ef14f0Smrg assert(a->exec == &_kgem_dummy_exec || 295263ef14f0Smrg a->exec == &kgem->exec[0] || 295363ef14f0Smrg a->exec == &kgem->exec[1]); 29549a906b70Schristos assert(a->handle == kgem->exec[0].handle || a->handle == kgem->exec[1].handle); 29559a906b70Schristos assert(RQ(a->rq) == kgem->next_request); 295663ef14f0Smrg assert(b->exec == &_kgem_dummy_exec || 295763ef14f0Smrg b->exec == &kgem->exec[0] || 295863ef14f0Smrg b->exec == &kgem->exec[1]); 29599a906b70Schristos assert(b->handle == kgem->exec[0].handle || b->handle == kgem->exec[1].handle); 29609a906b70Schristos assert(RQ(b->rq) == kgem->next_request); 29619a906b70Schristos 29629a906b70Schristos a->refcnt++; 29639a906b70Schristos b->refcnt++; 29649a906b70Schristos kgem_reset(kgem); 29659a906b70Schristos b->refcnt--; 29669a906b70Schristos a->refcnt--; 29679a906b70Schristos 29689a906b70Schristos assert(kgem->nreloc == 0); 29699a906b70Schristos assert(kgem->nexec == 0); 29709a906b70Schristos assert(a->exec == NULL); 29719a906b70Schristos assert(b->exec == NULL); 29729a906b70Schristos} 29739a906b70Schristos 29749a906b70Schristosstatic void __kgem_bo_destroy(struct kgem *kgem, struct kgem_bo *bo) 29759a906b70Schristos{ 29769a906b70Schristos DBG(("%s: handle=%d, size=%d\n", __FUNCTION__, bo->handle, bytes(bo))); 29779a906b70Schristos 29789a906b70Schristos assert(list_is_empty(&bo->list)); 297963ef14f0Smrg assert(list_is_empty(&bo->vma)); 29809a906b70Schristos assert(bo->refcnt == 0); 29819a906b70Schristos assert(bo->proxy == NULL); 29829a906b70Schristos assert(bo->active_scanout == 0); 29839a906b70Schristos assert_tiling(kgem, bo); 29849a906b70Schristos 29859a906b70Schristos bo->binding.offset = 0; 298603b705cfSriastradh 298703b705cfSriastradh if (DBG_NO_CACHE) 298803b705cfSriastradh goto destroy; 298903b705cfSriastradh 29909a906b70Schristos if (bo->prime) 29919a906b70Schristos goto destroy; 29929a906b70Schristos 299303b705cfSriastradh if (bo->snoop && 
!bo->flush) { 299403b705cfSriastradh DBG(("%s: handle=%d is snooped\n", __FUNCTION__, bo->handle)); 299503b705cfSriastradh assert(bo->reusable); 299603b705cfSriastradh assert(list_is_empty(&bo->list)); 299703b705cfSriastradh if (bo->exec == NULL && bo->rq && !__kgem_busy(kgem, bo->handle)) 299803b705cfSriastradh __kgem_bo_clear_busy(bo); 299903b705cfSriastradh if (bo->rq == NULL) 300003b705cfSriastradh kgem_bo_move_to_snoop(kgem, bo); 300103b705cfSriastradh return; 300203b705cfSriastradh } 30039a906b70Schristos if (!IS_USER_MAP(bo->map__cpu)) 300403b705cfSriastradh bo->flush = false; 300503b705cfSriastradh 300603b705cfSriastradh if (bo->scanout) { 300703b705cfSriastradh kgem_bo_move_to_scanout(kgem, bo); 300803b705cfSriastradh return; 300903b705cfSriastradh } 301003b705cfSriastradh 301103b705cfSriastradh if (bo->io) 301203b705cfSriastradh bo = kgem_bo_replace_io(bo); 301303b705cfSriastradh if (!bo->reusable) { 301403b705cfSriastradh DBG(("%s: handle=%d, not reusable\n", 301503b705cfSriastradh __FUNCTION__, bo->handle)); 301603b705cfSriastradh goto destroy; 301703b705cfSriastradh } 301803b705cfSriastradh 301903b705cfSriastradh assert(list_is_empty(&bo->vma)); 302003b705cfSriastradh assert(list_is_empty(&bo->list)); 302103b705cfSriastradh assert(bo->flush == false); 302203b705cfSriastradh assert(bo->snoop == false); 302303b705cfSriastradh assert(bo->io == false); 302403b705cfSriastradh assert(bo->scanout == false); 302563ef14f0Smrg assert_caching(kgem, bo); 302603b705cfSriastradh 302703b705cfSriastradh kgem_bo_undo(kgem, bo); 302803b705cfSriastradh assert(bo->refcnt == 0); 302903b705cfSriastradh 303003b705cfSriastradh if (bo->rq && bo->exec == NULL && !__kgem_busy(kgem, bo->handle)) 303103b705cfSriastradh __kgem_bo_clear_busy(bo); 303203b705cfSriastradh 303303b705cfSriastradh if (bo->rq) { 303403b705cfSriastradh struct list *cache; 303503b705cfSriastradh 303603b705cfSriastradh DBG(("%s: handle=%d -> active\n", __FUNCTION__, bo->handle)); 303703b705cfSriastradh if 
(bucket(bo) < NUM_CACHE_BUCKETS) 303803b705cfSriastradh cache = &kgem->active[bucket(bo)][bo->tiling]; 303903b705cfSriastradh else 304003b705cfSriastradh cache = &kgem->large; 304103b705cfSriastradh list_add(&bo->list, cache); 304203b705cfSriastradh return; 304303b705cfSriastradh } 304403b705cfSriastradh 304503b705cfSriastradh assert(bo->exec == NULL); 304603b705cfSriastradh assert(list_is_empty(&bo->request)); 304703b705cfSriastradh 30489a906b70Schristos if (bo->map__cpu == NULL || bucket(bo) >= NUM_CACHE_BUCKETS) { 304903b705cfSriastradh if (!kgem->has_llc && bo->domain == DOMAIN_CPU) 305003b705cfSriastradh goto destroy; 305103b705cfSriastradh 305203b705cfSriastradh DBG(("%s: handle=%d, purged\n", 305303b705cfSriastradh __FUNCTION__, bo->handle)); 305403b705cfSriastradh } 305503b705cfSriastradh 305603b705cfSriastradh kgem_bo_move_to_inactive(kgem, bo); 305703b705cfSriastradh return; 305803b705cfSriastradh 305903b705cfSriastradhdestroy: 306003b705cfSriastradh if (!bo->exec) 306103b705cfSriastradh kgem_bo_free(kgem, bo); 306203b705cfSriastradh} 306303b705cfSriastradh 306403b705cfSriastradhstatic void kgem_bo_unref(struct kgem *kgem, struct kgem_bo *bo) 306503b705cfSriastradh{ 306603b705cfSriastradh assert(bo->refcnt); 306703b705cfSriastradh if (--bo->refcnt == 0) 306803b705cfSriastradh __kgem_bo_destroy(kgem, bo); 306903b705cfSriastradh} 307003b705cfSriastradh 307103b705cfSriastradhstatic void kgem_buffer_release(struct kgem *kgem, struct kgem_buffer *bo) 307203b705cfSriastradh{ 30739a906b70Schristos assert(bo->base.io); 307403b705cfSriastradh while (!list_is_empty(&bo->base.vma)) { 307503b705cfSriastradh struct kgem_bo *cached; 307603b705cfSriastradh 307703b705cfSriastradh cached = list_first_entry(&bo->base.vma, struct kgem_bo, vma); 307803b705cfSriastradh assert(cached->proxy == &bo->base); 30799a906b70Schristos assert(cached != &bo->base); 308003b705cfSriastradh list_del(&cached->vma); 308103b705cfSriastradh 30829a906b70Schristos assert(*(struct kgem_bo 
**)cached->map__gtt == cached); 30839a906b70Schristos *(struct kgem_bo **)cached->map__gtt = NULL; 30849a906b70Schristos cached->map__gtt = NULL; 308503b705cfSriastradh 308603b705cfSriastradh kgem_bo_destroy(kgem, cached); 308703b705cfSriastradh } 308803b705cfSriastradh} 308903b705cfSriastradh 30909a906b70Schristosvoid kgem_retire__buffers(struct kgem *kgem) 309103b705cfSriastradh{ 309203b705cfSriastradh while (!list_is_empty(&kgem->active_buffers)) { 309303b705cfSriastradh struct kgem_buffer *bo = 309403b705cfSriastradh list_last_entry(&kgem->active_buffers, 309503b705cfSriastradh struct kgem_buffer, 309603b705cfSriastradh base.list); 309703b705cfSriastradh 30989a906b70Schristos DBG(("%s: handle=%d, busy? %d [%d]\n", 30999a906b70Schristos __FUNCTION__, bo->base.handle, bo->base.rq != NULL, bo->base.exec != NULL)); 31009a906b70Schristos 31019a906b70Schristos assert(bo->base.exec == NULL || RQ(bo->base.rq) == kgem->next_request); 310203b705cfSriastradh if (bo->base.rq) 310303b705cfSriastradh break; 310403b705cfSriastradh 310503b705cfSriastradh DBG(("%s: releasing upload cache for handle=%d? 
%d\n", 310603b705cfSriastradh __FUNCTION__, bo->base.handle, !list_is_empty(&bo->base.vma))); 310703b705cfSriastradh list_del(&bo->base.list); 310803b705cfSriastradh kgem_buffer_release(kgem, bo); 310903b705cfSriastradh kgem_bo_unref(kgem, &bo->base); 311003b705cfSriastradh } 311103b705cfSriastradh} 311203b705cfSriastradh 311303b705cfSriastradhstatic bool kgem_retire__flushing(struct kgem *kgem) 311403b705cfSriastradh{ 311503b705cfSriastradh struct kgem_bo *bo, *next; 311603b705cfSriastradh bool retired = false; 311703b705cfSriastradh 311803b705cfSriastradh list_for_each_entry_safe(bo, next, &kgem->flushing, request) { 31199a906b70Schristos assert(RQ(bo->rq) == (void *)kgem); 312003b705cfSriastradh assert(bo->exec == NULL); 312103b705cfSriastradh 312203b705cfSriastradh if (__kgem_busy(kgem, bo->handle)) 312303b705cfSriastradh break; 312403b705cfSriastradh 312503b705cfSriastradh __kgem_bo_clear_busy(bo); 312603b705cfSriastradh 312703b705cfSriastradh if (bo->refcnt) 312803b705cfSriastradh continue; 312903b705cfSriastradh 31309a906b70Schristos retired |= kgem_bo_move_to_cache(kgem, bo); 313103b705cfSriastradh } 313203b705cfSriastradh#if HAS_DEBUG_FULL 313303b705cfSriastradh { 313403b705cfSriastradh int count = 0; 313503b705cfSriastradh list_for_each_entry(bo, &kgem->flushing, request) 313603b705cfSriastradh count++; 313763ef14f0Smrg DBG(("%s: %d bo on flushing list, retired? 
%d\n", __FUNCTION__, count, retired)); 313803b705cfSriastradh } 313903b705cfSriastradh#endif 314003b705cfSriastradh 314103b705cfSriastradh kgem->need_retire |= !list_is_empty(&kgem->flushing); 314203b705cfSriastradh 314303b705cfSriastradh return retired; 314403b705cfSriastradh} 314503b705cfSriastradh 314663ef14f0Smrgstatic bool __kgem_bo_flush(struct kgem *kgem, struct kgem_bo *bo) 314763ef14f0Smrg{ 314863ef14f0Smrg struct drm_i915_gem_busy busy; 314963ef14f0Smrg 315063ef14f0Smrg if (!bo->needs_flush) 315163ef14f0Smrg return false; 315263ef14f0Smrg 315363ef14f0Smrg bo->needs_flush = false; 315463ef14f0Smrg 315563ef14f0Smrg VG_CLEAR(busy); 315663ef14f0Smrg busy.handle = bo->handle; 315763ef14f0Smrg busy.busy = !kgem->wedged; 315863ef14f0Smrg (void)do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_BUSY, &busy); 315963ef14f0Smrg DBG(("%s: handle=%d, busy=%d, wedged=%d\n", 316063ef14f0Smrg __FUNCTION__, bo->handle, busy.busy, kgem->wedged)); 316163ef14f0Smrg 316263ef14f0Smrg if (busy.busy == 0) 316363ef14f0Smrg return false; 316463ef14f0Smrg 316563ef14f0Smrg DBG(("%s: moving %d to flushing\n", 316663ef14f0Smrg __FUNCTION__, bo->handle)); 316763ef14f0Smrg list_add(&bo->request, &kgem->flushing); 316863ef14f0Smrg bo->rq = MAKE_REQUEST(kgem, !!(busy.busy & ~0x1ffff)); 316963ef14f0Smrg bo->needs_flush = busy.busy & 0xffff; 317063ef14f0Smrg kgem->need_retire = true; 317163ef14f0Smrg return true; 317263ef14f0Smrg} 317363ef14f0Smrg 317403b705cfSriastradhstatic bool __kgem_retire_rq(struct kgem *kgem, struct kgem_request *rq) 317503b705cfSriastradh{ 317603b705cfSriastradh bool retired = false; 317703b705cfSriastradh 317803b705cfSriastradh DBG(("%s: request %d complete\n", 317903b705cfSriastradh __FUNCTION__, rq->bo->handle)); 31809a906b70Schristos assert(RQ(rq->bo->rq) == rq); 318163ef14f0Smrg assert(rq != (struct kgem_request *)kgem); 318263ef14f0Smrg assert(rq != &kgem->static_request); 318303b705cfSriastradh 3184813957e3Ssnj if (rq == kgem->fence[rq->ring]) 3185813957e3Ssnj 
kgem->fence[rq->ring] = NULL; 3186813957e3Ssnj 318703b705cfSriastradh while (!list_is_empty(&rq->buffers)) { 318803b705cfSriastradh struct kgem_bo *bo; 318903b705cfSriastradh 319003b705cfSriastradh bo = list_first_entry(&rq->buffers, 319103b705cfSriastradh struct kgem_bo, 319203b705cfSriastradh request); 319303b705cfSriastradh 319403b705cfSriastradh assert(RQ(bo->rq) == rq); 319503b705cfSriastradh assert(bo->exec == NULL); 319603b705cfSriastradh assert(bo->domain == DOMAIN_GPU || bo->domain == DOMAIN_NONE); 319703b705cfSriastradh 319803b705cfSriastradh list_del(&bo->request); 319903b705cfSriastradh 320063ef14f0Smrg if (unlikely(__kgem_bo_flush(kgem, bo))) { 320163ef14f0Smrg assert(bo != rq->bo); 320263ef14f0Smrg DBG(("%s: movied %d to flushing\n", 320303b705cfSriastradh __FUNCTION__, bo->handle)); 320403b705cfSriastradh continue; 320503b705cfSriastradh } 320603b705cfSriastradh 320703b705cfSriastradh bo->domain = DOMAIN_NONE; 320803b705cfSriastradh bo->rq = NULL; 320903b705cfSriastradh if (bo->refcnt) 321003b705cfSriastradh continue; 321103b705cfSriastradh 32129a906b70Schristos retired |= kgem_bo_move_to_cache(kgem, bo); 321303b705cfSriastradh } 321403b705cfSriastradh 321503b705cfSriastradh assert(rq->bo->rq == NULL); 32169a906b70Schristos assert(rq->bo->exec == NULL); 321703b705cfSriastradh assert(list_is_empty(&rq->bo->request)); 32189a906b70Schristos assert(rq->bo->refcnt > 0); 321903b705cfSriastradh 322003b705cfSriastradh if (--rq->bo->refcnt == 0) { 322163ef14f0Smrg kgem_bo_move_to_inactive(kgem, rq->bo); 322263ef14f0Smrg retired = true; 322303b705cfSriastradh } 322403b705cfSriastradh 322503b705cfSriastradh __kgem_request_free(rq); 322603b705cfSriastradh return retired; 322703b705cfSriastradh} 322803b705cfSriastradh 322903b705cfSriastradhstatic bool kgem_retire__requests_ring(struct kgem *kgem, int ring) 323003b705cfSriastradh{ 323103b705cfSriastradh bool retired = false; 323203b705cfSriastradh 323363ef14f0Smrg assert(ring < ARRAY_SIZE(kgem->requests)); 
323403b705cfSriastradh while (!list_is_empty(&kgem->requests[ring])) { 323503b705cfSriastradh struct kgem_request *rq; 323603b705cfSriastradh 323763ef14f0Smrg DBG(("%s: retiring ring %d\n", __FUNCTION__, ring)); 323863ef14f0Smrg 323903b705cfSriastradh rq = list_first_entry(&kgem->requests[ring], 324003b705cfSriastradh struct kgem_request, 324103b705cfSriastradh list); 32429a906b70Schristos assert(rq->ring == ring); 324363ef14f0Smrg assert(rq->bo); 324463ef14f0Smrg assert(RQ(rq->bo->rq) == rq); 324503b705cfSriastradh if (__kgem_busy(kgem, rq->bo->handle)) 324603b705cfSriastradh break; 324703b705cfSriastradh 324803b705cfSriastradh retired |= __kgem_retire_rq(kgem, rq); 324903b705cfSriastradh } 325003b705cfSriastradh 325103b705cfSriastradh#if HAS_DEBUG_FULL 325203b705cfSriastradh { 325303b705cfSriastradh struct kgem_bo *bo; 325403b705cfSriastradh int count = 0; 325503b705cfSriastradh 325603b705cfSriastradh list_for_each_entry(bo, &kgem->requests[ring], request) 325703b705cfSriastradh count++; 325803b705cfSriastradh 325903b705cfSriastradh bo = NULL; 326003b705cfSriastradh if (!list_is_empty(&kgem->requests[ring])) 326103b705cfSriastradh bo = list_first_entry(&kgem->requests[ring], 326203b705cfSriastradh struct kgem_request, 326303b705cfSriastradh list)->bo; 326403b705cfSriastradh 326563ef14f0Smrg DBG(("%s: ring=%d, %d outstanding requests, oldest=%d, retired? %d\n", 326663ef14f0Smrg __FUNCTION__, ring, count, bo ? 
bo->handle : 0, retired)); 326703b705cfSriastradh } 326803b705cfSriastradh#endif 326903b705cfSriastradh 327003b705cfSriastradh return retired; 327103b705cfSriastradh} 327203b705cfSriastradh 327303b705cfSriastradhstatic bool kgem_retire__requests(struct kgem *kgem) 327403b705cfSriastradh{ 327503b705cfSriastradh bool retired = false; 327603b705cfSriastradh int n; 327703b705cfSriastradh 327803b705cfSriastradh for (n = 0; n < ARRAY_SIZE(kgem->requests); n++) { 327903b705cfSriastradh retired |= kgem_retire__requests_ring(kgem, n); 328003b705cfSriastradh kgem->need_retire |= !list_is_empty(&kgem->requests[n]); 328103b705cfSriastradh } 328203b705cfSriastradh 328303b705cfSriastradh return retired; 328403b705cfSriastradh} 328503b705cfSriastradh 328603b705cfSriastradhbool kgem_retire(struct kgem *kgem) 328703b705cfSriastradh{ 328803b705cfSriastradh bool retired = false; 328903b705cfSriastradh 32909a906b70Schristos DBG(("%s, need_retire?=%d\n", __FUNCTION__, kgem->need_retire)); 329103b705cfSriastradh 329203b705cfSriastradh kgem->need_retire = false; 329303b705cfSriastradh 329403b705cfSriastradh retired |= kgem_retire__flushing(kgem); 329503b705cfSriastradh retired |= kgem_retire__requests(kgem); 329603b705cfSriastradh 329703b705cfSriastradh DBG(("%s -- retired=%d, need_retire=%d\n", 329803b705cfSriastradh __FUNCTION__, retired, kgem->need_retire)); 329903b705cfSriastradh 330003b705cfSriastradh kgem->retire(kgem); 330103b705cfSriastradh 330203b705cfSriastradh return retired; 330303b705cfSriastradh} 330403b705cfSriastradh 330503b705cfSriastradhbool __kgem_ring_is_idle(struct kgem *kgem, int ring) 330603b705cfSriastradh{ 330703b705cfSriastradh struct kgem_request *rq; 330803b705cfSriastradh 33099a906b70Schristos assert(ring < ARRAY_SIZE(kgem->requests)); 331003b705cfSriastradh assert(!list_is_empty(&kgem->requests[ring])); 331103b705cfSriastradh 3312813957e3Ssnj rq = kgem->fence[ring]; 3313813957e3Ssnj if (rq) { 3314813957e3Ssnj struct kgem_request *tmp; 3315813957e3Ssnj 
3316813957e3Ssnj if (__kgem_busy(kgem, rq->bo->handle)) { 3317813957e3Ssnj DBG(("%s: last fence handle=%d still busy\n", 3318813957e3Ssnj __FUNCTION__, rq->bo->handle)); 3319813957e3Ssnj return false; 3320813957e3Ssnj } 3321813957e3Ssnj 3322813957e3Ssnj do { 3323813957e3Ssnj tmp = list_first_entry(&kgem->requests[ring], 3324813957e3Ssnj struct kgem_request, 3325813957e3Ssnj list); 3326813957e3Ssnj assert(tmp->ring == ring); 3327813957e3Ssnj __kgem_retire_rq(kgem, tmp); 3328813957e3Ssnj } while (tmp != rq); 3329813957e3Ssnj 3330813957e3Ssnj assert(kgem->fence[ring] == NULL); 3331813957e3Ssnj if (list_is_empty(&kgem->requests[ring])) 3332813957e3Ssnj return true; 3333813957e3Ssnj } 3334813957e3Ssnj 333503b705cfSriastradh rq = list_last_entry(&kgem->requests[ring], 333603b705cfSriastradh struct kgem_request, list); 33379a906b70Schristos assert(rq->ring == ring); 333863ef14f0Smrg assert(rq->bo); 333963ef14f0Smrg assert(RQ(rq->bo->rq) == rq); 334003b705cfSriastradh if (__kgem_busy(kgem, rq->bo->handle)) { 334103b705cfSriastradh DBG(("%s: last requests handle=%d still busy\n", 334203b705cfSriastradh __FUNCTION__, rq->bo->handle)); 3343813957e3Ssnj kgem->fence[ring] = rq; 334403b705cfSriastradh return false; 334503b705cfSriastradh } 334603b705cfSriastradh 334703b705cfSriastradh DBG(("%s: ring=%d idle (handle=%d)\n", 334803b705cfSriastradh __FUNCTION__, ring, rq->bo->handle)); 334903b705cfSriastradh 3350813957e3Ssnj while (!list_is_empty(&kgem->requests[ring])) { 3351813957e3Ssnj rq = list_first_entry(&kgem->requests[ring], 3352813957e3Ssnj struct kgem_request, 3353813957e3Ssnj list); 3354813957e3Ssnj assert(rq->ring == ring); 3355813957e3Ssnj __kgem_retire_rq(kgem, rq); 3356813957e3Ssnj } 33579a906b70Schristos 335803b705cfSriastradh return true; 335903b705cfSriastradh} 336003b705cfSriastradh 336163ef14f0Smrgbool __kgem_retire_requests_upto(struct kgem *kgem, struct kgem_bo *bo) 3362813957e3Ssnj{ 336363ef14f0Smrg struct kgem_request * const rq = RQ(bo->rq), *tmp; 
336463ef14f0Smrg struct list *requests = &kgem->requests[rq->ring]; 336563ef14f0Smrg 336663ef14f0Smrg DBG(("%s(handle=%d, ring=%d)\n", __FUNCTION__, bo->handle, rq->ring)); 3367813957e3Ssnj 3368813957e3Ssnj assert(rq != &kgem->static_request); 3369813957e3Ssnj if (rq == (struct kgem_request *)kgem) { 3370813957e3Ssnj __kgem_bo_clear_busy(bo); 337163ef14f0Smrg return false; 3372813957e3Ssnj } 3373813957e3Ssnj 337463ef14f0Smrg assert(rq->ring < ARRAY_SIZE(kgem->requests)); 3375813957e3Ssnj do { 3376813957e3Ssnj tmp = list_first_entry(requests, struct kgem_request, list); 3377813957e3Ssnj assert(tmp->ring == rq->ring); 3378813957e3Ssnj __kgem_retire_rq(kgem, tmp); 3379813957e3Ssnj } while (tmp != rq); 338063ef14f0Smrg 338163ef14f0Smrg assert(bo->needs_flush || bo->rq == NULL); 338263ef14f0Smrg assert(bo->needs_flush || list_is_empty(&bo->request)); 338363ef14f0Smrg assert(bo->needs_flush || bo->domain == DOMAIN_NONE); 338463ef14f0Smrg return bo->rq; 3385813957e3Ssnj} 3386813957e3Ssnj 33879a906b70Schristos#if 0 33889a906b70Schristosstatic void kgem_commit__check_reloc(struct kgem *kgem) 33899a906b70Schristos{ 33909a906b70Schristos struct kgem_request *rq = kgem->next_request; 33919a906b70Schristos struct kgem_bo *bo; 33929a906b70Schristos bool has_64bit = kgem->gen >= 0100; 33939a906b70Schristos int i; 33949a906b70Schristos 33959a906b70Schristos for (i = 0; i < kgem->nreloc; i++) { 33969a906b70Schristos list_for_each_entry(bo, &rq->buffers, request) { 33979a906b70Schristos if (bo->target_handle == kgem->reloc[i].target_handle) { 33989a906b70Schristos uint64_t value = 0; 33999a906b70Schristos gem_read(kgem->fd, rq->bo->handle, &value, kgem->reloc[i].offset, has_64bit ? 
8 : 4); 34009a906b70Schristos assert(bo->exec->offset == -1 || value == bo->exec->offset + (int)kgem->reloc[i].delta); 34019a906b70Schristos break; 34029a906b70Schristos } 34039a906b70Schristos } 34049a906b70Schristos } 34059a906b70Schristos} 34069a906b70Schristos#else 34079a906b70Schristos#define kgem_commit__check_reloc(kgem) 34089a906b70Schristos#endif 34099a906b70Schristos 34109a906b70Schristos#ifndef NDEBUG 34119a906b70Schristosstatic void kgem_commit__check_buffers(struct kgem *kgem) 34129a906b70Schristos{ 34139a906b70Schristos struct kgem_buffer *bo; 34149a906b70Schristos 34159a906b70Schristos list_for_each_entry(bo, &kgem->active_buffers, base.list) 34169a906b70Schristos assert(bo->base.exec == NULL); 34179a906b70Schristos} 34189a906b70Schristos#else 34199a906b70Schristos#define kgem_commit__check_buffers(kgem) 34209a906b70Schristos#endif 34219a906b70Schristos 342203b705cfSriastradhstatic void kgem_commit(struct kgem *kgem) 342303b705cfSriastradh{ 342403b705cfSriastradh struct kgem_request *rq = kgem->next_request; 342503b705cfSriastradh struct kgem_bo *bo, *next; 342603b705cfSriastradh 34279a906b70Schristos kgem_commit__check_reloc(kgem); 34289a906b70Schristos 342903b705cfSriastradh list_for_each_entry_safe(bo, next, &rq->buffers, request) { 343003b705cfSriastradh assert(next->request.prev == &bo->request); 343103b705cfSriastradh 343203b705cfSriastradh DBG(("%s: release handle=%d (proxy? %d), dirty? %d flush? %d, snoop? 
%d -> offset=%x\n", 343303b705cfSriastradh __FUNCTION__, bo->handle, bo->proxy != NULL, 343403b705cfSriastradh bo->gpu_dirty, bo->needs_flush, bo->snoop, 343503b705cfSriastradh (unsigned)bo->exec->offset)); 343603b705cfSriastradh 343703b705cfSriastradh assert(bo->exec); 343803b705cfSriastradh assert(bo->proxy == NULL || bo->exec == &_kgem_dummy_exec); 343903b705cfSriastradh assert(RQ(bo->rq) == rq || (RQ(bo->proxy->rq) == rq)); 344003b705cfSriastradh 344103b705cfSriastradh bo->presumed_offset = bo->exec->offset; 344203b705cfSriastradh bo->exec = NULL; 344303b705cfSriastradh bo->target_handle = -1; 344403b705cfSriastradh 344503b705cfSriastradh if (!bo->refcnt && !bo->reusable) { 344603b705cfSriastradh assert(!bo->snoop); 34479a906b70Schristos assert(!bo->proxy); 344803b705cfSriastradh kgem_bo_free(kgem, bo); 344903b705cfSriastradh continue; 345003b705cfSriastradh } 345103b705cfSriastradh 345203b705cfSriastradh bo->binding.offset = 0; 345303b705cfSriastradh bo->domain = DOMAIN_GPU; 345403b705cfSriastradh bo->gpu_dirty = false; 345563ef14f0Smrg bo->gtt_dirty = false; 345603b705cfSriastradh 345703b705cfSriastradh if (bo->proxy) { 345803b705cfSriastradh /* proxies are not used for domain tracking */ 345903b705cfSriastradh __kgem_bo_clear_busy(bo); 346003b705cfSriastradh } 346103b705cfSriastradh 34629a906b70Schristos kgem->scanout_busy |= bo->scanout && bo->needs_flush; 346303b705cfSriastradh } 346403b705cfSriastradh 346503b705cfSriastradh if (rq == &kgem->static_request) { 346603b705cfSriastradh struct drm_i915_gem_set_domain set_domain; 346703b705cfSriastradh 346803b705cfSriastradh DBG(("%s: syncing due to allocation failure\n", __FUNCTION__)); 346903b705cfSriastradh 347003b705cfSriastradh VG_CLEAR(set_domain); 347103b705cfSriastradh set_domain.handle = rq->bo->handle; 347203b705cfSriastradh set_domain.read_domains = I915_GEM_DOMAIN_GTT; 347303b705cfSriastradh set_domain.write_domain = I915_GEM_DOMAIN_GTT; 34749a906b70Schristos if (do_ioctl(kgem->fd, 
DRM_IOCTL_I915_GEM_SET_DOMAIN, &set_domain)) { 347503b705cfSriastradh DBG(("%s: sync: GPU hang detected\n", __FUNCTION__)); 347603b705cfSriastradh kgem_throttle(kgem); 347703b705cfSriastradh } 347803b705cfSriastradh 347963ef14f0Smrg while (!list_is_empty(&rq->buffers)) { 348063ef14f0Smrg bo = list_first_entry(&rq->buffers, 348163ef14f0Smrg struct kgem_bo, 348263ef14f0Smrg request); 348363ef14f0Smrg 348463ef14f0Smrg assert(RQ(bo->rq) == rq); 348563ef14f0Smrg assert(bo->exec == NULL); 348663ef14f0Smrg assert(bo->domain == DOMAIN_GPU); 348763ef14f0Smrg 348863ef14f0Smrg list_del(&bo->request); 348963ef14f0Smrg bo->domain = DOMAIN_NONE; 349063ef14f0Smrg bo->rq = NULL; 349163ef14f0Smrg 349263ef14f0Smrg if (bo->refcnt == 0) 349363ef14f0Smrg _kgem_bo_destroy(kgem, bo); 349463ef14f0Smrg } 349563ef14f0Smrg 349603b705cfSriastradh kgem_retire(kgem); 349703b705cfSriastradh assert(list_is_empty(&rq->buffers)); 349803b705cfSriastradh 34999a906b70Schristos assert(rq->bo->map__gtt == NULL); 3500813957e3Ssnj assert(rq->bo->map__wc == NULL); 35019a906b70Schristos assert(rq->bo->map__cpu == NULL); 350203b705cfSriastradh gem_close(kgem->fd, rq->bo->handle); 350303b705cfSriastradh kgem_cleanup_cache(kgem); 350403b705cfSriastradh } else { 350563ef14f0Smrg assert(rq != (struct kgem_request *)kgem); 35069a906b70Schristos assert(rq->ring < ARRAY_SIZE(kgem->requests)); 350763ef14f0Smrg assert(rq->bo); 350803b705cfSriastradh list_add_tail(&rq->list, &kgem->requests[rq->ring]); 350903b705cfSriastradh kgem->need_throttle = kgem->need_retire = 1; 3510813957e3Ssnj 3511813957e3Ssnj if (kgem->fence[rq->ring] == NULL && 3512813957e3Ssnj __kgem_busy(kgem, rq->bo->handle)) 3513813957e3Ssnj kgem->fence[rq->ring] = rq; 351403b705cfSriastradh } 351503b705cfSriastradh 351603b705cfSriastradh kgem->next_request = NULL; 35179a906b70Schristos 35189a906b70Schristos kgem_commit__check_buffers(kgem); 351903b705cfSriastradh} 352003b705cfSriastradh 352103b705cfSriastradhstatic void kgem_close_list(struct kgem 
*kgem, struct list *head) 352203b705cfSriastradh{ 352303b705cfSriastradh while (!list_is_empty(head)) 352403b705cfSriastradh kgem_bo_free(kgem, list_first_entry(head, struct kgem_bo, list)); 352503b705cfSriastradh} 352603b705cfSriastradh 352703b705cfSriastradhstatic void kgem_close_inactive(struct kgem *kgem) 352803b705cfSriastradh{ 352903b705cfSriastradh unsigned int i; 353003b705cfSriastradh 353163ef14f0Smrg for (i = 0; i < ARRAY_SIZE(kgem->inactive); i++) { 353203b705cfSriastradh kgem_close_list(kgem, &kgem->inactive[i]); 353363ef14f0Smrg assert(list_is_empty(&kgem->inactive[i])); 353463ef14f0Smrg } 353503b705cfSriastradh} 353603b705cfSriastradh 353703b705cfSriastradhstatic void kgem_finish_buffers(struct kgem *kgem) 353803b705cfSriastradh{ 353903b705cfSriastradh struct kgem_buffer *bo, *next; 354003b705cfSriastradh 354103b705cfSriastradh list_for_each_entry_safe(bo, next, &kgem->batch_buffers, base.list) { 35429a906b70Schristos DBG(("%s: buffer handle=%d, used=%d, exec?=%d, write=%d, mmapped=%s, refcnt=%d\n", 354303b705cfSriastradh __FUNCTION__, bo->base.handle, bo->used, bo->base.exec!=NULL, 35449a906b70Schristos bo->write, bo->mmapped == MMAPPED_CPU ? "cpu" : bo->mmapped == MMAPPED_GTT ? 
"gtt" : "no", 35459a906b70Schristos bo->base.refcnt)); 354603b705cfSriastradh 354703b705cfSriastradh assert(next->base.list.prev == &bo->base.list); 354803b705cfSriastradh assert(bo->base.io); 354903b705cfSriastradh assert(bo->base.refcnt >= 1); 355003b705cfSriastradh 35519a906b70Schristos if (bo->base.refcnt > 1 && !bo->base.exec) { 35529a906b70Schristos DBG(("%s: skipping unattached handle=%d, used=%d, refcnt=%d\n", 35539a906b70Schristos __FUNCTION__, bo->base.handle, bo->used, bo->base.refcnt)); 355403b705cfSriastradh continue; 355503b705cfSriastradh } 355603b705cfSriastradh 355703b705cfSriastradh if (!bo->write) { 355803b705cfSriastradh assert(bo->base.exec || bo->base.refcnt > 1); 355903b705cfSriastradh goto decouple; 356003b705cfSriastradh } 356103b705cfSriastradh 356203b705cfSriastradh if (bo->mmapped) { 35639a906b70Schristos uint32_t used; 356403b705cfSriastradh 356503b705cfSriastradh assert(!bo->need_io); 356603b705cfSriastradh 356703b705cfSriastradh used = ALIGN(bo->used, PAGE_SIZE); 356803b705cfSriastradh if (!DBG_NO_UPLOAD_ACTIVE && 356903b705cfSriastradh used + PAGE_SIZE <= bytes(&bo->base) && 35709a906b70Schristos (kgem->has_llc || bo->mmapped == MMAPPED_GTT || bo->base.snoop)) { 35719a906b70Schristos DBG(("%s: retaining upload buffer (%d/%d): used=%d, refcnt=%d\n", 35729a906b70Schristos __FUNCTION__, bo->used, bytes(&bo->base), used, bo->base.refcnt)); 357303b705cfSriastradh bo->used = used; 357403b705cfSriastradh list_move(&bo->base.list, 357503b705cfSriastradh &kgem->active_buffers); 35769a906b70Schristos kgem->need_retire = true; 357703b705cfSriastradh continue; 357803b705cfSriastradh } 357903b705cfSriastradh DBG(("%s: discarding mmapped buffer, used=%d, map type=%d\n", 35809a906b70Schristos __FUNCTION__, bo->used, bo->mmapped)); 358103b705cfSriastradh goto decouple; 358203b705cfSriastradh } 358303b705cfSriastradh 35849a906b70Schristos if (!bo->used || !bo->base.exec) { 358503b705cfSriastradh /* Unless we replace the handle in the execbuffer, 
358603b705cfSriastradh * then this bo will become active. So decouple it 358703b705cfSriastradh * from the buffer list and track it in the normal 358803b705cfSriastradh * manner. 358903b705cfSriastradh */ 359003b705cfSriastradh goto decouple; 359103b705cfSriastradh } 359203b705cfSriastradh 359303b705cfSriastradh assert(bo->need_io); 359403b705cfSriastradh assert(bo->base.rq == MAKE_REQUEST(kgem->next_request, kgem->ring)); 359503b705cfSriastradh assert(bo->base.domain != DOMAIN_GPU); 359603b705cfSriastradh 359703b705cfSriastradh if (bo->base.refcnt == 1 && 359803b705cfSriastradh bo->base.size.pages.count > 1 && 359903b705cfSriastradh bo->used < bytes(&bo->base) / 2) { 360003b705cfSriastradh struct kgem_bo *shrink; 360103b705cfSriastradh unsigned alloc = NUM_PAGES(bo->used); 360203b705cfSriastradh 360303b705cfSriastradh shrink = search_snoop_cache(kgem, alloc, 360403b705cfSriastradh CREATE_INACTIVE | CREATE_NO_RETIRE); 360503b705cfSriastradh if (shrink) { 360603b705cfSriastradh void *map; 360703b705cfSriastradh int n; 360803b705cfSriastradh 360903b705cfSriastradh DBG(("%s: used=%d, shrinking %d to %d, handle %d to %d\n", 361003b705cfSriastradh __FUNCTION__, 361103b705cfSriastradh bo->used, bytes(&bo->base), bytes(shrink), 361203b705cfSriastradh bo->base.handle, shrink->handle)); 361303b705cfSriastradh 361403b705cfSriastradh assert(bo->used <= bytes(shrink)); 361503b705cfSriastradh map = kgem_bo_map__cpu(kgem, shrink); 361603b705cfSriastradh if (map) { 361703b705cfSriastradh memcpy(map, bo->mem, bo->used); 361803b705cfSriastradh 361903b705cfSriastradh shrink->target_handle = 362003b705cfSriastradh kgem->has_handle_lut ? 
bo->base.target_handle : shrink->handle; 362103b705cfSriastradh for (n = 0; n < kgem->nreloc; n++) { 362203b705cfSriastradh if (kgem->reloc[n].target_handle == bo->base.target_handle) { 362363ef14f0Smrg uint64_t addr = (int)kgem->reloc[n].delta + shrink->presumed_offset; 362463ef14f0Smrg kgem->batch[kgem->reloc[n].offset/sizeof(kgem->batch[0])] = addr; 362563ef14f0Smrg if (kgem->gen >= 0100) 362663ef14f0Smrg kgem->batch[kgem->reloc[n].offset/sizeof(kgem->batch[0]) + 1] = addr >> 32; 362763ef14f0Smrg 362803b705cfSriastradh kgem->reloc[n].target_handle = shrink->target_handle; 362903b705cfSriastradh kgem->reloc[n].presumed_offset = shrink->presumed_offset; 363003b705cfSriastradh } 363103b705cfSriastradh } 363203b705cfSriastradh 363303b705cfSriastradh bo->base.exec->handle = shrink->handle; 363403b705cfSriastradh bo->base.exec->offset = shrink->presumed_offset; 363503b705cfSriastradh shrink->exec = bo->base.exec; 363603b705cfSriastradh shrink->rq = bo->base.rq; 363703b705cfSriastradh list_replace(&bo->base.request, 363803b705cfSriastradh &shrink->request); 363903b705cfSriastradh list_init(&bo->base.request); 364003b705cfSriastradh shrink->needs_flush = bo->base.gpu_dirty; 364103b705cfSriastradh 364203b705cfSriastradh bo->base.exec = NULL; 364303b705cfSriastradh bo->base.rq = NULL; 364403b705cfSriastradh bo->base.gpu_dirty = false; 364503b705cfSriastradh bo->base.needs_flush = false; 364603b705cfSriastradh bo->used = 0; 364703b705cfSriastradh 364803b705cfSriastradh goto decouple; 364903b705cfSriastradh } 365003b705cfSriastradh 365103b705cfSriastradh __kgem_bo_destroy(kgem, shrink); 365203b705cfSriastradh } 365303b705cfSriastradh 365403b705cfSriastradh shrink = search_linear_cache(kgem, alloc, 365503b705cfSriastradh CREATE_INACTIVE | CREATE_NO_RETIRE); 365603b705cfSriastradh if (shrink) { 365703b705cfSriastradh int n; 365803b705cfSriastradh 365903b705cfSriastradh DBG(("%s: used=%d, shrinking %d to %d, handle %d to %d\n", 366003b705cfSriastradh __FUNCTION__, 
366103b705cfSriastradh bo->used, bytes(&bo->base), bytes(shrink), 366203b705cfSriastradh bo->base.handle, shrink->handle)); 366303b705cfSriastradh 366403b705cfSriastradh assert(bo->used <= bytes(shrink)); 36659a906b70Schristos if (gem_write__cachealigned(kgem->fd, shrink->handle, 36669a906b70Schristos 0, bo->used, bo->mem) == 0) { 366703b705cfSriastradh shrink->target_handle = 366803b705cfSriastradh kgem->has_handle_lut ? bo->base.target_handle : shrink->handle; 366903b705cfSriastradh for (n = 0; n < kgem->nreloc; n++) { 367003b705cfSriastradh if (kgem->reloc[n].target_handle == bo->base.target_handle) { 367163ef14f0Smrg uint64_t addr = (int)kgem->reloc[n].delta + shrink->presumed_offset; 367263ef14f0Smrg kgem->batch[kgem->reloc[n].offset/sizeof(kgem->batch[0])] = addr; 367363ef14f0Smrg if (kgem->gen >= 0100) 367463ef14f0Smrg kgem->batch[kgem->reloc[n].offset/sizeof(kgem->batch[0]) + 1] = addr >> 32; 367563ef14f0Smrg 367603b705cfSriastradh kgem->reloc[n].target_handle = shrink->target_handle; 367703b705cfSriastradh kgem->reloc[n].presumed_offset = shrink->presumed_offset; 367803b705cfSriastradh } 367903b705cfSriastradh } 368003b705cfSriastradh 368103b705cfSriastradh bo->base.exec->handle = shrink->handle; 368203b705cfSriastradh bo->base.exec->offset = shrink->presumed_offset; 368303b705cfSriastradh shrink->exec = bo->base.exec; 368403b705cfSriastradh shrink->rq = bo->base.rq; 368503b705cfSriastradh list_replace(&bo->base.request, 368603b705cfSriastradh &shrink->request); 368703b705cfSriastradh list_init(&bo->base.request); 368803b705cfSriastradh shrink->needs_flush = bo->base.gpu_dirty; 368903b705cfSriastradh 369003b705cfSriastradh bo->base.exec = NULL; 369103b705cfSriastradh bo->base.rq = NULL; 369203b705cfSriastradh bo->base.gpu_dirty = false; 369303b705cfSriastradh bo->base.needs_flush = false; 369403b705cfSriastradh bo->used = 0; 369503b705cfSriastradh 369603b705cfSriastradh goto decouple; 369703b705cfSriastradh } 369803b705cfSriastradh 369903b705cfSriastradh 
__kgem_bo_destroy(kgem, shrink); 370003b705cfSriastradh } 370103b705cfSriastradh } 370203b705cfSriastradh 370303b705cfSriastradh DBG(("%s: handle=%d, uploading %d/%d\n", 370403b705cfSriastradh __FUNCTION__, bo->base.handle, bo->used, bytes(&bo->base))); 370503b705cfSriastradh ASSERT_IDLE(kgem, bo->base.handle); 370603b705cfSriastradh assert(bo->used <= bytes(&bo->base)); 37079a906b70Schristos gem_write__cachealigned(kgem->fd, bo->base.handle, 37089a906b70Schristos 0, bo->used, bo->mem); 370903b705cfSriastradh bo->need_io = 0; 371003b705cfSriastradh 371103b705cfSriastradhdecouple: 371203b705cfSriastradh DBG(("%s: releasing handle=%d\n", 371303b705cfSriastradh __FUNCTION__, bo->base.handle)); 371403b705cfSriastradh list_del(&bo->base.list); 371503b705cfSriastradh kgem_bo_unref(kgem, &bo->base); 371603b705cfSriastradh } 371703b705cfSriastradh} 371803b705cfSriastradh 371903b705cfSriastradhstatic void kgem_cleanup(struct kgem *kgem) 372003b705cfSriastradh{ 372103b705cfSriastradh int n; 372203b705cfSriastradh 372303b705cfSriastradh for (n = 0; n < ARRAY_SIZE(kgem->requests); n++) { 372403b705cfSriastradh while (!list_is_empty(&kgem->requests[n])) { 372503b705cfSriastradh struct kgem_request *rq; 372603b705cfSriastradh 372703b705cfSriastradh rq = list_first_entry(&kgem->requests[n], 372803b705cfSriastradh struct kgem_request, 372903b705cfSriastradh list); 37309a906b70Schristos assert(rq->ring == n); 373103b705cfSriastradh while (!list_is_empty(&rq->buffers)) { 373203b705cfSriastradh struct kgem_bo *bo; 373303b705cfSriastradh 373403b705cfSriastradh bo = list_first_entry(&rq->buffers, 373503b705cfSriastradh struct kgem_bo, 373603b705cfSriastradh request); 373703b705cfSriastradh 373803b705cfSriastradh bo->exec = NULL; 373903b705cfSriastradh bo->gpu_dirty = false; 374003b705cfSriastradh __kgem_bo_clear_busy(bo); 374103b705cfSriastradh if (bo->refcnt == 0) 374203b705cfSriastradh kgem_bo_free(kgem, bo); 374303b705cfSriastradh } 374403b705cfSriastradh 374563ef14f0Smrg if 
(--rq->bo->refcnt == 0) 374663ef14f0Smrg kgem_bo_free(kgem, rq->bo); 374763ef14f0Smrg 374803b705cfSriastradh __kgem_request_free(rq); 374903b705cfSriastradh } 375003b705cfSriastradh } 375103b705cfSriastradh 375203b705cfSriastradh kgem_close_inactive(kgem); 375303b705cfSriastradh} 375403b705cfSriastradh 3755813957e3Ssnjstatic int 3756813957e3Ssnjkgem_batch_write(struct kgem *kgem, 3757813957e3Ssnj struct kgem_bo *bo, 3758813957e3Ssnj uint32_t size) 375903b705cfSriastradh{ 3760813957e3Ssnj char *ptr; 376103b705cfSriastradh int ret; 376203b705cfSriastradh 376363ef14f0Smrg assert(bo->exec == NULL); 376463ef14f0Smrg assert(bo->rq == NULL); 376563ef14f0Smrg assert(!__kgem_busy(kgem, bo->handle)); 376603b705cfSriastradh 37679a906b70Schristos#if DBG_NO_EXEC 37689a906b70Schristos { 37699a906b70Schristos uint32_t batch[] = { MI_BATCH_BUFFER_END, 0}; 3770813957e3Ssnj return gem_write(kgem->fd, bo->handle, 0, sizeof(batch), batch); 37719a906b70Schristos } 37729a906b70Schristos#endif 37739a906b70Schristos 3774813957e3Ssnj assert(!bo->scanout); 37759a906b70Schristosretry: 3776813957e3Ssnj ptr = NULL; 3777813957e3Ssnj if (bo->domain == DOMAIN_CPU || kgem->has_llc) { 3778813957e3Ssnj ptr = bo->map__cpu; 3779813957e3Ssnj if (ptr == NULL) 3780813957e3Ssnj ptr = __kgem_bo_map__cpu(kgem, bo); 3781813957e3Ssnj } else if (kgem->has_wc_mmap) { 3782813957e3Ssnj ptr = bo->map__wc; 3783813957e3Ssnj if (ptr == NULL) 3784813957e3Ssnj ptr = __kgem_bo_map__wc(kgem, bo); 3785813957e3Ssnj } 3786813957e3Ssnj if (ptr) { 3787813957e3Ssnj memcpy(ptr, kgem->batch, sizeof(uint32_t)*kgem->nbatch); 3788813957e3Ssnj if (kgem->surface != kgem->batch_size) { 3789813957e3Ssnj ret = PAGE_ALIGN(sizeof(uint32_t) * kgem->batch_size); 3790813957e3Ssnj ret -= sizeof(uint32_t) * kgem->surface; 3791813957e3Ssnj ptr += size - ret; 3792813957e3Ssnj memcpy(ptr, kgem->batch + kgem->surface, 3793813957e3Ssnj (kgem->batch_size - kgem->surface)*sizeof(uint32_t)); 3794813957e3Ssnj } 3795813957e3Ssnj return 0; 
3796813957e3Ssnj } 3797813957e3Ssnj 379803b705cfSriastradh /* If there is no surface data, just upload the batch */ 37999a906b70Schristos if (kgem->surface == kgem->batch_size) { 3800813957e3Ssnj if ((ret = gem_write__cachealigned(kgem->fd, bo->handle, 38019a906b70Schristos 0, sizeof(uint32_t)*kgem->nbatch, 38029a906b70Schristos kgem->batch)) == 0) 38039a906b70Schristos return 0; 38049a906b70Schristos 38059a906b70Schristos goto expire; 38069a906b70Schristos } 380703b705cfSriastradh 380803b705cfSriastradh /* Are the batch pages conjoint with the surface pages? */ 380903b705cfSriastradh if (kgem->surface < kgem->nbatch + PAGE_SIZE/sizeof(uint32_t)) { 381003b705cfSriastradh assert(size == PAGE_ALIGN(kgem->batch_size*sizeof(uint32_t))); 3811813957e3Ssnj if ((ret = gem_write__cachealigned(kgem->fd, bo->handle, 38129a906b70Schristos 0, kgem->batch_size*sizeof(uint32_t), 38139a906b70Schristos kgem->batch)) == 0) 38149a906b70Schristos return 0; 38159a906b70Schristos 38169a906b70Schristos goto expire; 381703b705cfSriastradh } 381803b705cfSriastradh 381903b705cfSriastradh /* Disjoint surface/batch, upload separately */ 3820813957e3Ssnj if ((ret = gem_write__cachealigned(kgem->fd, bo->handle, 38219a906b70Schristos 0, sizeof(uint32_t)*kgem->nbatch, 38229a906b70Schristos kgem->batch))) 38239a906b70Schristos goto expire; 382403b705cfSriastradh 382503b705cfSriastradh ret = PAGE_ALIGN(sizeof(uint32_t) * kgem->batch_size); 382603b705cfSriastradh ret -= sizeof(uint32_t) * kgem->surface; 382703b705cfSriastradh assert(size-ret >= kgem->nbatch*sizeof(uint32_t)); 3828813957e3Ssnj if (gem_write(kgem->fd, bo->handle, 38299a906b70Schristos size - ret, (kgem->batch_size - kgem->surface)*sizeof(uint32_t), 38309a906b70Schristos kgem->batch + kgem->surface)) 38319a906b70Schristos goto expire; 38329a906b70Schristos 38339a906b70Schristos return 0; 38349a906b70Schristos 38359a906b70Schristosexpire: 38369a906b70Schristos assert(ret != EINVAL); 38379a906b70Schristos 38389a906b70Schristos 
(void)__kgem_throttle_retire(kgem, 0); 38399a906b70Schristos if (kgem_expire_cache(kgem)) 38409a906b70Schristos goto retry; 38419a906b70Schristos 38429a906b70Schristos if (kgem_cleanup_cache(kgem)) 38439a906b70Schristos goto retry; 38449a906b70Schristos 38459a906b70Schristos ERR(("%s: failed to write batch (handle=%d): %d\n", 3846813957e3Ssnj __FUNCTION__, bo->handle, -ret)); 38479a906b70Schristos return ret; 384803b705cfSriastradh} 384903b705cfSriastradh 385003b705cfSriastradhvoid kgem_reset(struct kgem *kgem) 385103b705cfSriastradh{ 385203b705cfSriastradh if (kgem->next_request) { 385303b705cfSriastradh struct kgem_request *rq = kgem->next_request; 385403b705cfSriastradh 385503b705cfSriastradh while (!list_is_empty(&rq->buffers)) { 385603b705cfSriastradh struct kgem_bo *bo = 385703b705cfSriastradh list_first_entry(&rq->buffers, 385803b705cfSriastradh struct kgem_bo, 385903b705cfSriastradh request); 386003b705cfSriastradh list_del(&bo->request); 386103b705cfSriastradh 386203b705cfSriastradh assert(RQ(bo->rq) == rq); 386303b705cfSriastradh 386403b705cfSriastradh bo->binding.offset = 0; 386503b705cfSriastradh bo->exec = NULL; 386603b705cfSriastradh bo->target_handle = -1; 386703b705cfSriastradh bo->gpu_dirty = false; 386803b705cfSriastradh 386903b705cfSriastradh if (bo->needs_flush && __kgem_busy(kgem, bo->handle)) { 387003b705cfSriastradh assert(bo->domain == DOMAIN_GPU || bo->domain == DOMAIN_NONE); 387103b705cfSriastradh list_add(&bo->request, &kgem->flushing); 387203b705cfSriastradh bo->rq = (void *)kgem; 38739a906b70Schristos kgem->need_retire = true; 387403b705cfSriastradh } else 387503b705cfSriastradh __kgem_bo_clear_busy(bo); 387603b705cfSriastradh 387703b705cfSriastradh if (bo->refcnt || bo->rq) 387803b705cfSriastradh continue; 387903b705cfSriastradh 38809a906b70Schristos kgem_bo_move_to_cache(kgem, bo); 388103b705cfSriastradh } 388203b705cfSriastradh 388303b705cfSriastradh if (rq != &kgem->static_request) { 388403b705cfSriastradh list_init(&rq->list); 
388503b705cfSriastradh __kgem_request_free(rq); 388603b705cfSriastradh } 388703b705cfSriastradh } 388803b705cfSriastradh 388903b705cfSriastradh kgem->nfence = 0; 389003b705cfSriastradh kgem->nexec = 0; 389103b705cfSriastradh kgem->nreloc = 0; 389203b705cfSriastradh kgem->nreloc__self = 0; 389303b705cfSriastradh kgem->aperture = 0; 389403b705cfSriastradh kgem->aperture_fenced = 0; 38959a906b70Schristos kgem->aperture_max_fence = 0; 389603b705cfSriastradh kgem->nbatch = 0; 389703b705cfSriastradh kgem->surface = kgem->batch_size; 389803b705cfSriastradh kgem->mode = KGEM_NONE; 38999a906b70Schristos kgem->needs_semaphore = false; 39009a906b70Schristos kgem->needs_reservation = false; 390103b705cfSriastradh kgem->flush = 0; 390203b705cfSriastradh kgem->batch_flags = kgem->batch_flags_base; 3903813957e3Ssnj assert(kgem->batch); 390403b705cfSriastradh 390503b705cfSriastradh kgem->next_request = __kgem_request_alloc(kgem); 390603b705cfSriastradh 390703b705cfSriastradh kgem_sna_reset(kgem); 390803b705cfSriastradh} 390903b705cfSriastradh 3910813957e3Ssnjstatic int compact_batch_surface(struct kgem *kgem, int *shrink) 391103b705cfSriastradh{ 3912813957e3Ssnj int size, n; 391303b705cfSriastradh 391403b705cfSriastradh if (!kgem->has_relaxed_delta) 39159a906b70Schristos return kgem->batch_size * sizeof(uint32_t); 391603b705cfSriastradh 391703b705cfSriastradh /* See if we can pack the contents into one or two pages */ 391803b705cfSriastradh n = ALIGN(kgem->batch_size, 1024); 391903b705cfSriastradh size = n - kgem->surface + kgem->nbatch; 392003b705cfSriastradh size = ALIGN(size, 1024); 392103b705cfSriastradh 3922813957e3Ssnj *shrink = (n - size) * sizeof(uint32_t); 392303b705cfSriastradh return size * sizeof(uint32_t); 392403b705cfSriastradh} 392503b705cfSriastradh 392663ef14f0Smrgstatic struct kgem_bo *first_available(struct kgem *kgem, struct list *list) 392763ef14f0Smrg{ 392863ef14f0Smrg struct kgem_bo *bo; 392963ef14f0Smrg 393063ef14f0Smrg list_for_each_entry(bo, list, list) { 
393163ef14f0Smrg assert(bo->refcnt > 0); 393263ef14f0Smrg 393363ef14f0Smrg if (bo->rq) { 393463ef14f0Smrg assert(RQ(bo->rq)->bo == bo); 393563ef14f0Smrg if (__kgem_busy(kgem, bo->handle)) 393663ef14f0Smrg break; 393763ef14f0Smrg 393863ef14f0Smrg __kgem_retire_rq(kgem, RQ(bo->rq)); 393963ef14f0Smrg assert(bo->rq == NULL); 394063ef14f0Smrg } 394163ef14f0Smrg 394263ef14f0Smrg if (bo->refcnt > 1) 394363ef14f0Smrg continue; 394463ef14f0Smrg 394563ef14f0Smrg list_move_tail(&bo->list, list); 394663ef14f0Smrg return kgem_bo_reference(bo); 394763ef14f0Smrg } 394863ef14f0Smrg 394963ef14f0Smrg return NULL; 395063ef14f0Smrg} 395163ef14f0Smrg 395203b705cfSriastradhstatic struct kgem_bo * 3953813957e3Ssnjkgem_create_batch(struct kgem *kgem) 395403b705cfSriastradh{ 395503b705cfSriastradh struct kgem_bo *bo; 395663ef14f0Smrg int size, shrink = 0; 3957813957e3Ssnj 395863ef14f0Smrg#if !DBG_NO_SHRINK_BATCHES 3959813957e3Ssnj if (kgem->surface != kgem->batch_size) 3960813957e3Ssnj size = compact_batch_surface(kgem, &shrink); 3961813957e3Ssnj else 3962813957e3Ssnj size = kgem->nbatch * sizeof(uint32_t); 396303b705cfSriastradh 396403b705cfSriastradh if (size <= 4096) { 396563ef14f0Smrg bo = first_available(kgem, &kgem->pinned_batches[0]); 396663ef14f0Smrg if (bo) 3967813957e3Ssnj goto write; 396863ef14f0Smrg } 396903b705cfSriastradh 397063ef14f0Smrg if (size <= 16384) { 397163ef14f0Smrg bo = first_available(kgem, &kgem->pinned_batches[1]); 397263ef14f0Smrg if (bo) 397363ef14f0Smrg goto write; 397403b705cfSriastradh } 397503b705cfSriastradh 39769a906b70Schristos if (kgem->gen == 020) { 39779a906b70Schristos bo = kgem_create_linear(kgem, size, CREATE_CACHED | CREATE_TEMPORARY); 39789a906b70Schristos if (bo) 3979813957e3Ssnj goto write; 398003b705cfSriastradh 39819a906b70Schristos /* Nothing available for reuse, rely on the kernel wa */ 39829a906b70Schristos if (kgem->has_pinned_batches) { 39839a906b70Schristos bo = kgem_create_linear(kgem, size, CREATE_CACHED | CREATE_TEMPORARY); 
39849a906b70Schristos if (bo) { 39859a906b70Schristos kgem->batch_flags &= ~LOCAL_I915_EXEC_IS_PINNED; 3986813957e3Ssnj goto write; 39879a906b70Schristos } 39889a906b70Schristos } 39899a906b70Schristos 39909a906b70Schristos if (size < 16384) { 39919a906b70Schristos bo = list_first_entry(&kgem->pinned_batches[size > 4096], 39929a906b70Schristos struct kgem_bo, 39939a906b70Schristos list); 39949a906b70Schristos list_move_tail(&bo->list, &kgem->pinned_batches[size > 4096]); 399503b705cfSriastradh 39969a906b70Schristos DBG(("%s: syncing due to busy batches\n", __FUNCTION__)); 399763ef14f0Smrg if (kgem_bo_wait(kgem, bo)) 39989a906b70Schristos return NULL; 399903b705cfSriastradh 40009a906b70Schristos kgem_retire(kgem); 40019a906b70Schristos assert(bo->rq == NULL); 4002813957e3Ssnj bo = kgem_bo_reference(bo); 4003813957e3Ssnj goto write; 40049a906b70Schristos } 400503b705cfSriastradh } 400663ef14f0Smrg#else 400763ef14f0Smrg if (kgem->surface != kgem->batch_size) 400863ef14f0Smrg size = kgem->batch_size * sizeof(uint32_t); 400963ef14f0Smrg else 401063ef14f0Smrg size = kgem->nbatch * sizeof(uint32_t); 401163ef14f0Smrg#endif 401203b705cfSriastradh 401363ef14f0Smrg if (!kgem->batch_bo || !kgem->has_llc) { 4014813957e3Ssnj bo = kgem_create_linear(kgem, size, CREATE_NO_THROTTLE); 4015813957e3Ssnj if (bo) { 4016813957e3Ssnjwrite: 4017813957e3Ssnj kgem_fixup_relocs(kgem, bo, shrink); 4018813957e3Ssnj if (kgem_batch_write(kgem, bo, size)) { 4019813957e3Ssnj kgem_bo_destroy(kgem, bo); 4020813957e3Ssnj return NULL; 4021813957e3Ssnj } 402263ef14f0Smrg return bo; 4023813957e3Ssnj } 4024813957e3Ssnj } 402563ef14f0Smrg 4026813957e3Ssnj return kgem_new_batch(kgem); 402703b705cfSriastradh} 402803b705cfSriastradh 40299a906b70Schristos#if !NDEBUG 40309a906b70Schristosstatic bool dump_file(const char *path) 40319a906b70Schristos{ 40329a906b70Schristos FILE *file; 40339a906b70Schristos size_t len = 0; 40349a906b70Schristos char *line = NULL; 40359a906b70Schristos 40369a906b70Schristos file = 
fopen(path, "r"); 40379a906b70Schristos if (file == NULL) 40389a906b70Schristos return false; 40399a906b70Schristos 40409a906b70Schristos while (getline(&line, &len, file) != -1) 40419a906b70Schristos ErrorF("%s", line); 40429a906b70Schristos 40439a906b70Schristos free(line); 40449a906b70Schristos fclose(file); 40459a906b70Schristos return true; 40469a906b70Schristos} 40479a906b70Schristos 40489a906b70Schristosstatic void dump_debugfs(struct kgem *kgem, const char *name) 40499a906b70Schristos{ 40509a906b70Schristos char path[80]; 40519a906b70Schristos int minor = kgem_get_minor(kgem); 40529a906b70Schristos 40539a906b70Schristos if (minor < 0) 40549a906b70Schristos return; 40559a906b70Schristos 40569a906b70Schristos sprintf(path, "/sys/kernel/debug/dri/%d/%s", minor, name); 40579a906b70Schristos if (dump_file(path)) 40589a906b70Schristos return; 40599a906b70Schristos 40609a906b70Schristos sprintf(path, "/debug/dri/%d/%s", minor, name); 40619a906b70Schristos if (dump_file(path)) 40629a906b70Schristos return; 40639a906b70Schristos} 40649a906b70Schristos 40659a906b70Schristosstatic void dump_gtt_info(struct kgem *kgem) 40669a906b70Schristos{ 40679a906b70Schristos dump_debugfs(kgem, "i915_gem_gtt"); 40689a906b70Schristos} 40699a906b70Schristos 40709a906b70Schristosstatic void dump_fence_regs(struct kgem *kgem) 40719a906b70Schristos{ 40729a906b70Schristos dump_debugfs(kgem, "i915_gem_fence_regs"); 40739a906b70Schristos} 40749a906b70Schristos#endif 40759a906b70Schristos 40769a906b70Schristosstatic int do_execbuf(struct kgem *kgem, struct drm_i915_gem_execbuffer2 *execbuf) 40779a906b70Schristos{ 407863ef14f0Smrg int ret; 40799a906b70Schristos 40809a906b70Schristosretry: 40819a906b70Schristos ret = do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_EXECBUFFER2, execbuf); 40829a906b70Schristos if (ret == 0) 40839a906b70Schristos return 0; 40849a906b70Schristos 40859a906b70Schristos DBG(("%s: failed ret=%d, throttling and discarding cache\n", __FUNCTION__, ret)); 40869a906b70Schristos 
(void)__kgem_throttle_retire(kgem, 0); 40879a906b70Schristos if (kgem_expire_cache(kgem)) 40889a906b70Schristos goto retry; 40899a906b70Schristos 40909a906b70Schristos if (kgem_cleanup_cache(kgem)) 40919a906b70Schristos goto retry; 40929a906b70Schristos 40939a906b70Schristos /* last gasp */ 4094813957e3Ssnj ret = do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_EXECBUFFER2, execbuf); 409563ef14f0Smrg if (ret != -ENOSPC) 409663ef14f0Smrg return ret; 409763ef14f0Smrg 409863ef14f0Smrg /* One final trick up our sleeve for when we run out of space. 409963ef14f0Smrg * We turn everything off to free up our pinned framebuffers, 410063ef14f0Smrg * sprites and cursors, and try just one more time. 410163ef14f0Smrg */ 4102813957e3Ssnj 4103813957e3Ssnj xf86DrvMsg(kgem_get_screen_index(kgem), X_WARNING, 4104813957e3Ssnj "Failed to submit rendering commands, trying again with outputs disabled.\n"); 4105813957e3Ssnj 410663ef14f0Smrg if (sna_mode_disable(__to_sna(kgem))) { 4107813957e3Ssnj kgem_cleanup_cache(kgem); 4108813957e3Ssnj ret = do_ioctl(kgem->fd, 4109813957e3Ssnj DRM_IOCTL_I915_GEM_EXECBUFFER2, 4110813957e3Ssnj execbuf); 4111813957e3Ssnj DBG(("%s: last_gasp ret=%d\n", __FUNCTION__, ret)); 411263ef14f0Smrg sna_mode_enable(__to_sna(kgem)); 4113813957e3Ssnj } 4114813957e3Ssnj 4115813957e3Ssnj return ret; 41169a906b70Schristos} 41179a906b70Schristos 411803b705cfSriastradhvoid _kgem_submit(struct kgem *kgem) 411903b705cfSriastradh{ 412003b705cfSriastradh struct kgem_request *rq; 412103b705cfSriastradh uint32_t batch_end; 412263ef14f0Smrg int i, ret; 412303b705cfSriastradh 412403b705cfSriastradh assert(!DBG_NO_HW); 412503b705cfSriastradh assert(!kgem->wedged); 412603b705cfSriastradh 412703b705cfSriastradh assert(kgem->nbatch); 412803b705cfSriastradh assert(kgem->nbatch <= KGEM_BATCH_SIZE(kgem)); 412903b705cfSriastradh assert(kgem->nbatch <= kgem->surface); 413003b705cfSriastradh 413103b705cfSriastradh batch_end = kgem_end_batch(kgem); 413203b705cfSriastradh kgem_sna_flush(kgem); 
413303b705cfSriastradh 41349a906b70Schristos DBG(("batch[%d/%d, flags=%x]: %d %d %d %d, nreloc=%d, nexec=%d, nfence=%d, aperture=%d [fenced=%d]\n", 41359a906b70Schristos kgem->mode, kgem->ring, kgem->batch_flags, 41369a906b70Schristos batch_end, kgem->nbatch, kgem->surface, kgem->batch_size, 41379a906b70Schristos kgem->nreloc, kgem->nexec, kgem->nfence, kgem->aperture, kgem->aperture_fenced)); 413803b705cfSriastradh 413903b705cfSriastradh assert(kgem->nbatch <= kgem->batch_size); 414003b705cfSriastradh assert(kgem->nbatch <= kgem->surface); 414103b705cfSriastradh assert(kgem->nreloc <= ARRAY_SIZE(kgem->reloc)); 414203b705cfSriastradh assert(kgem->nexec < ARRAY_SIZE(kgem->exec)); 414303b705cfSriastradh assert(kgem->nfence <= kgem->fence_max); 414403b705cfSriastradh 414503b705cfSriastradh kgem_finish_buffers(kgem); 414603b705cfSriastradh 41479a906b70Schristos#if SHOW_BATCH_BEFORE 414803b705cfSriastradh __kgem_batch_debug(kgem, batch_end); 414903b705cfSriastradh#endif 415003b705cfSriastradh 415103b705cfSriastradh rq = kgem->next_request; 4152813957e3Ssnj assert(rq->bo == NULL); 4153813957e3Ssnj 4154813957e3Ssnj rq->bo = kgem_create_batch(kgem); 415503b705cfSriastradh if (rq->bo) { 4156813957e3Ssnj struct drm_i915_gem_execbuffer2 execbuf; 415703b705cfSriastradh 415803b705cfSriastradh assert(!rq->bo->needs_flush); 415903b705cfSriastradh 416003b705cfSriastradh i = kgem->nexec++; 4161813957e3Ssnj kgem->exec[i].handle = rq->bo->handle; 416203b705cfSriastradh kgem->exec[i].relocation_count = kgem->nreloc; 416303b705cfSriastradh kgem->exec[i].relocs_ptr = (uintptr_t)kgem->reloc; 416403b705cfSriastradh kgem->exec[i].alignment = 0; 416503b705cfSriastradh kgem->exec[i].offset = rq->bo->presumed_offset; 416663ef14f0Smrg /* Make sure the kernel releases any fence, ignored if gen4+ */ 416763ef14f0Smrg kgem->exec[i].flags = EXEC_OBJECT_NEEDS_FENCE; 416803b705cfSriastradh kgem->exec[i].rsvd1 = 0; 416903b705cfSriastradh kgem->exec[i].rsvd2 = 0; 417003b705cfSriastradh 
417103b705cfSriastradh rq->bo->exec = &kgem->exec[i]; 417203b705cfSriastradh rq->bo->rq = MAKE_REQUEST(rq, kgem->ring); /* useful sanity check */ 417303b705cfSriastradh list_add(&rq->bo->request, &rq->buffers); 417403b705cfSriastradh rq->ring = kgem->ring == KGEM_BLT; 417503b705cfSriastradh 4176813957e3Ssnj memset(&execbuf, 0, sizeof(execbuf)); 4177813957e3Ssnj execbuf.buffers_ptr = (uintptr_t)kgem->exec; 4178813957e3Ssnj execbuf.buffer_count = kgem->nexec; 417963ef14f0Smrg if (kgem->gen < 030) 418063ef14f0Smrg execbuf.batch_len = batch_end*sizeof(uint32_t); 4181813957e3Ssnj execbuf.flags = kgem->ring | kgem->batch_flags; 4182813957e3Ssnj 4183813957e3Ssnj if (DBG_DUMP) { 4184813957e3Ssnj int fd = open("/tmp/i915-batchbuffers.dump", 4185813957e3Ssnj O_WRONLY | O_CREAT | O_APPEND, 4186813957e3Ssnj 0666); 4187813957e3Ssnj if (fd != -1) { 4188813957e3Ssnj ret = write(fd, kgem->batch, batch_end*sizeof(uint32_t)); 4189813957e3Ssnj fd = close(fd); 419003b705cfSriastradh } 4191813957e3Ssnj } 419203b705cfSriastradh 4193813957e3Ssnj ret = do_execbuf(kgem, &execbuf); 419463ef14f0Smrg } else 419563ef14f0Smrg ret = -ENOMEM; 419603b705cfSriastradh 419763ef14f0Smrg if (ret < 0) { 419863ef14f0Smrg kgem_throttle(kgem); 419963ef14f0Smrg if (!kgem->wedged) { 420063ef14f0Smrg xf86DrvMsg(kgem_get_screen_index(kgem), X_ERROR, 420163ef14f0Smrg "Failed to submit rendering commands (%s), disabling acceleration.\n", 420263ef14f0Smrg strerror(-ret)); 420363ef14f0Smrg __kgem_set_wedged(kgem); 4204813957e3Ssnj } 420503b705cfSriastradh 420603b705cfSriastradh#if !NDEBUG 420763ef14f0Smrg ErrorF("batch[%d/%d]: %d %d %d, nreloc=%d, nexec=%d, nfence=%d, aperture=%d, fenced=%d, high=%d,%d: errno=%d\n", 420863ef14f0Smrg kgem->mode, kgem->ring, batch_end, kgem->nbatch, kgem->surface, 420963ef14f0Smrg kgem->nreloc, kgem->nexec, kgem->nfence, kgem->aperture, kgem->aperture_fenced, kgem->aperture_high, kgem->aperture_total, -ret); 421003b705cfSriastradh 421163ef14f0Smrg for (i = 0; i < kgem->nexec; i++) { 
421263ef14f0Smrg struct kgem_bo *bo, *found = NULL; 421303b705cfSriastradh 421463ef14f0Smrg list_for_each_entry(bo, &kgem->next_request->buffers, request) { 421563ef14f0Smrg if (bo->handle == kgem->exec[i].handle) { 421663ef14f0Smrg found = bo; 421763ef14f0Smrg break; 421803b705cfSriastradh } 4219813957e3Ssnj } 422063ef14f0Smrg ErrorF("exec[%d] = handle:%d, presumed offset: %x, size: %d, tiling %d, fenced %d, snooped %d, deleted %d\n", 422163ef14f0Smrg i, 422263ef14f0Smrg kgem->exec[i].handle, 422363ef14f0Smrg (int)kgem->exec[i].offset, 422463ef14f0Smrg found ? kgem_bo_size(found) : -1, 422563ef14f0Smrg found ? found->tiling : -1, 422663ef14f0Smrg (int)(kgem->exec[i].flags & EXEC_OBJECT_NEEDS_FENCE), 422763ef14f0Smrg found ? found->snoop : -1, 422863ef14f0Smrg found ? found->purged : -1); 422963ef14f0Smrg } 423063ef14f0Smrg for (i = 0; i < kgem->nreloc; i++) { 423163ef14f0Smrg ErrorF("reloc[%d] = pos:%d, target:%d, delta:%d, read:%x, write:%x, offset:%x\n", 423263ef14f0Smrg i, 423363ef14f0Smrg (int)kgem->reloc[i].offset, 423463ef14f0Smrg kgem->reloc[i].target_handle, 423563ef14f0Smrg kgem->reloc[i].delta, 423663ef14f0Smrg kgem->reloc[i].read_domains, 423763ef14f0Smrg kgem->reloc[i].write_domain, 423863ef14f0Smrg (int)kgem->reloc[i].presumed_offset); 423963ef14f0Smrg } 424063ef14f0Smrg 424163ef14f0Smrg { 424263ef14f0Smrg struct drm_i915_gem_get_aperture aperture; 424363ef14f0Smrg if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_GET_APERTURE, &aperture) == 0) 424463ef14f0Smrg ErrorF("Aperture size %lld, available %lld\n", 424563ef14f0Smrg (long long)aperture.aper_size, 424663ef14f0Smrg (long long)aperture.aper_available_size); 424763ef14f0Smrg } 424863ef14f0Smrg 424963ef14f0Smrg if (ret == -ENOSPC) 425063ef14f0Smrg dump_gtt_info(kgem); 425163ef14f0Smrg if (ret == -EDEADLK) 425263ef14f0Smrg dump_fence_regs(kgem); 425363ef14f0Smrg 425463ef14f0Smrg if (DEBUG_SYNC) { 425563ef14f0Smrg int fd = open("/tmp/batchbuffer", O_WRONLY | O_CREAT | O_APPEND, 0666); 425663ef14f0Smrg if (fd 
!= -1) { 425763ef14f0Smrg int ignored = write(fd, kgem->batch, batch_end*sizeof(uint32_t)); 425863ef14f0Smrg assert(ignored == batch_end*sizeof(uint32_t)); 425963ef14f0Smrg close(fd); 4260813957e3Ssnj } 426103b705cfSriastradh 426263ef14f0Smrg FatalError("SNA: failed to submit batchbuffer, errno=%d\n", -ret); 426363ef14f0Smrg } 426463ef14f0Smrg#endif 426563ef14f0Smrg } else { 426663ef14f0Smrg if (DEBUG_SYNC) { 426763ef14f0Smrg struct drm_i915_gem_set_domain set_domain; 42689a906b70Schristos 426963ef14f0Smrg VG_CLEAR(set_domain); 427063ef14f0Smrg set_domain.handle = rq->bo->handle; 427163ef14f0Smrg set_domain.read_domains = I915_GEM_DOMAIN_GTT; 427263ef14f0Smrg set_domain.write_domain = I915_GEM_DOMAIN_GTT; 4273813957e3Ssnj 427463ef14f0Smrg ret = do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_DOMAIN, &set_domain); 427503b705cfSriastradh } 427663ef14f0Smrg 42779a906b70Schristos#if SHOW_BATCH_AFTER 427863ef14f0Smrg if (gem_read(kgem->fd, rq->bo->handle, kgem->batch, 0, batch_end*sizeof(uint32_t)) == 0) 427963ef14f0Smrg __kgem_batch_debug(kgem, batch_end); 42809a906b70Schristos#endif 428163ef14f0Smrg 428263ef14f0Smrg kgem_commit(kgem); 428363ef14f0Smrg } 428463ef14f0Smrg 428563ef14f0Smrg if (unlikely(kgem->wedged)) 428603b705cfSriastradh kgem_cleanup(kgem); 428703b705cfSriastradh 428803b705cfSriastradh kgem_reset(kgem); 428903b705cfSriastradh 429003b705cfSriastradh assert(kgem->next_request != NULL); 429103b705cfSriastradh} 429203b705cfSriastradh 429303b705cfSriastradhvoid kgem_throttle(struct kgem *kgem) 429403b705cfSriastradh{ 429563ef14f0Smrg if (unlikely(kgem->wedged)) 429603b705cfSriastradh return; 429703b705cfSriastradh 4298813957e3Ssnj if (__kgem_throttle(kgem, true)) { 429903b705cfSriastradh xf86DrvMsg(kgem_get_screen_index(kgem), X_ERROR, 430003b705cfSriastradh "Detected a hung GPU, disabling acceleration.\n"); 4301813957e3Ssnj __kgem_set_wedged(kgem); 43029a906b70Schristos kgem->need_throttle = false; 430303b705cfSriastradh } 430403b705cfSriastradh} 
430503b705cfSriastradh 43069a906b70Schristosint kgem_is_wedged(struct kgem *kgem) 43079a906b70Schristos{ 43089a906b70Schristos return __kgem_throttle(kgem, true); 43099a906b70Schristos} 43109a906b70Schristos 43119a906b70Schristosstatic void kgem_purge_cache(struct kgem *kgem) 431203b705cfSriastradh{ 431303b705cfSriastradh struct kgem_bo *bo, *next; 431403b705cfSriastradh int i; 431503b705cfSriastradh 431603b705cfSriastradh for (i = 0; i < ARRAY_SIZE(kgem->inactive); i++) { 431703b705cfSriastradh list_for_each_entry_safe(bo, next, &kgem->inactive[i], list) { 431803b705cfSriastradh if (!kgem_bo_is_retained(kgem, bo)) { 431903b705cfSriastradh DBG(("%s: purging %d\n", 432003b705cfSriastradh __FUNCTION__, bo->handle)); 432103b705cfSriastradh kgem_bo_free(kgem, bo); 432203b705cfSriastradh } 432303b705cfSriastradh } 432403b705cfSriastradh } 432503b705cfSriastradh 432603b705cfSriastradh kgem->need_purge = false; 432703b705cfSriastradh} 432803b705cfSriastradh 432903b705cfSriastradhvoid kgem_clean_scanout_cache(struct kgem *kgem) 433003b705cfSriastradh{ 433103b705cfSriastradh while (!list_is_empty(&kgem->scanout)) { 433203b705cfSriastradh struct kgem_bo *bo; 433303b705cfSriastradh 433403b705cfSriastradh bo = list_first_entry(&kgem->scanout, struct kgem_bo, list); 433503b705cfSriastradh 433603b705cfSriastradh assert(bo->scanout); 433703b705cfSriastradh assert(!bo->refcnt); 43389a906b70Schristos assert(!bo->prime); 433903b705cfSriastradh assert(bo->proxy == NULL); 434003b705cfSriastradh 434103b705cfSriastradh if (bo->exec || __kgem_busy(kgem, bo->handle)) 434203b705cfSriastradh break; 434303b705cfSriastradh 434403b705cfSriastradh DBG(("%s: handle=%d, fb=%d (reusable=%d)\n", 434503b705cfSriastradh __FUNCTION__, bo->handle, bo->delta, bo->reusable)); 434603b705cfSriastradh list_del(&bo->list); 434703b705cfSriastradh 43489a906b70Schristos kgem_bo_rmfb(kgem, bo); 434903b705cfSriastradh bo->scanout = false; 435003b705cfSriastradh 435103b705cfSriastradh if (!bo->purged) { 
435203b705cfSriastradh bo->reusable = true; 435303b705cfSriastradh if (kgem->has_llc && 435403b705cfSriastradh !gem_set_caching(kgem->fd, bo->handle, SNOOPED)) 435503b705cfSriastradh bo->reusable = false; 435603b705cfSriastradh 435703b705cfSriastradh } 435803b705cfSriastradh 435903b705cfSriastradh __kgem_bo_destroy(kgem, bo); 436003b705cfSriastradh } 436103b705cfSriastradh} 436203b705cfSriastradh 436303b705cfSriastradhvoid kgem_clean_large_cache(struct kgem *kgem) 436403b705cfSriastradh{ 436503b705cfSriastradh while (!list_is_empty(&kgem->large_inactive)) { 436603b705cfSriastradh kgem_bo_free(kgem, 436703b705cfSriastradh list_first_entry(&kgem->large_inactive, 436803b705cfSriastradh struct kgem_bo, list)); 436903b705cfSriastradh 437003b705cfSriastradh } 437103b705cfSriastradh} 437203b705cfSriastradh 437303b705cfSriastradhbool kgem_expire_cache(struct kgem *kgem) 437403b705cfSriastradh{ 437503b705cfSriastradh time_t now, expire; 437603b705cfSriastradh struct kgem_bo *bo; 437703b705cfSriastradh unsigned int size = 0, count = 0; 437803b705cfSriastradh bool idle; 437903b705cfSriastradh unsigned int i; 438003b705cfSriastradh 438163ef14f0Smrg if (!time(&now)) 438263ef14f0Smrg return false; 438303b705cfSriastradh 438403b705cfSriastradh while (__kgem_freed_bo) { 438503b705cfSriastradh bo = __kgem_freed_bo; 438603b705cfSriastradh __kgem_freed_bo = *(struct kgem_bo **)bo; 438703b705cfSriastradh free(bo); 438803b705cfSriastradh } 438903b705cfSriastradh 439003b705cfSriastradh while (__kgem_freed_request) { 439103b705cfSriastradh struct kgem_request *rq = __kgem_freed_request; 439203b705cfSriastradh __kgem_freed_request = *(struct kgem_request **)rq; 439303b705cfSriastradh free(rq); 439403b705cfSriastradh } 439503b705cfSriastradh 439603b705cfSriastradh kgem_clean_large_cache(kgem); 439763ef14f0Smrg if (__to_sna(kgem)->scrn->vtSema) 439803b705cfSriastradh kgem_clean_scanout_cache(kgem); 439903b705cfSriastradh 440003b705cfSriastradh expire = 0; 440103b705cfSriastradh 
list_for_each_entry(bo, &kgem->snoop, list) { 440203b705cfSriastradh if (bo->delta) { 440303b705cfSriastradh expire = now - MAX_INACTIVE_TIME/2; 440403b705cfSriastradh break; 440503b705cfSriastradh } 440603b705cfSriastradh 440763ef14f0Smrg assert(now); 440803b705cfSriastradh bo->delta = now; 440903b705cfSriastradh } 441003b705cfSriastradh if (expire) { 441103b705cfSriastradh while (!list_is_empty(&kgem->snoop)) { 441203b705cfSriastradh bo = list_last_entry(&kgem->snoop, struct kgem_bo, list); 441303b705cfSriastradh 441403b705cfSriastradh if (bo->delta > expire) 441503b705cfSriastradh break; 441603b705cfSriastradh 441703b705cfSriastradh kgem_bo_free(kgem, bo); 441803b705cfSriastradh } 441903b705cfSriastradh } 442003b705cfSriastradh#ifdef DEBUG_MEMORY 442103b705cfSriastradh { 442203b705cfSriastradh long snoop_size = 0; 442303b705cfSriastradh int snoop_count = 0; 442403b705cfSriastradh list_for_each_entry(bo, &kgem->snoop, list) 442503b705cfSriastradh snoop_count++, snoop_size += bytes(bo); 44269a906b70Schristos DBG(("%s: still allocated %d bo, %ld bytes, in snoop cache\n", 44279a906b70Schristos __FUNCTION__, snoop_count, snoop_size)); 442803b705cfSriastradh } 442903b705cfSriastradh#endif 443003b705cfSriastradh 443103b705cfSriastradh kgem_retire(kgem); 443263ef14f0Smrg if (unlikely(kgem->wedged)) 443303b705cfSriastradh kgem_cleanup(kgem); 443403b705cfSriastradh 443503b705cfSriastradh kgem->expire(kgem); 443603b705cfSriastradh 443703b705cfSriastradh if (kgem->need_purge) 443803b705cfSriastradh kgem_purge_cache(kgem); 443903b705cfSriastradh 44409a906b70Schristos if (kgem->need_retire) 44419a906b70Schristos kgem_retire(kgem); 444203b705cfSriastradh 44439a906b70Schristos expire = 0; 44449a906b70Schristos idle = true; 444503b705cfSriastradh for (i = 0; i < ARRAY_SIZE(kgem->inactive); i++) { 444603b705cfSriastradh idle &= list_is_empty(&kgem->inactive[i]); 444703b705cfSriastradh list_for_each_entry(bo, &kgem->inactive[i], list) { 444803b705cfSriastradh if (bo->delta) { 
444903b705cfSriastradh expire = now - MAX_INACTIVE_TIME; 445003b705cfSriastradh break; 445103b705cfSriastradh } 445203b705cfSriastradh 445363ef14f0Smrg assert(now); 445463ef14f0Smrg kgem_bo_set_purgeable(kgem, bo); 445503b705cfSriastradh bo->delta = now; 445603b705cfSriastradh } 445703b705cfSriastradh } 44589a906b70Schristos if (expire == 0) { 44599a906b70Schristos DBG(("%s: idle? %d\n", __FUNCTION__, idle)); 44609a906b70Schristos kgem->need_expire = !idle; 446103b705cfSriastradh return false; 446203b705cfSriastradh } 446303b705cfSriastradh 44649a906b70Schristos idle = true; 446503b705cfSriastradh for (i = 0; i < ARRAY_SIZE(kgem->inactive); i++) { 446603b705cfSriastradh struct list preserve; 446703b705cfSriastradh 446803b705cfSriastradh list_init(&preserve); 446903b705cfSriastradh while (!list_is_empty(&kgem->inactive[i])) { 447003b705cfSriastradh bo = list_last_entry(&kgem->inactive[i], 447103b705cfSriastradh struct kgem_bo, list); 447203b705cfSriastradh 447303b705cfSriastradh if (bo->delta > expire) { 447403b705cfSriastradh idle = false; 447503b705cfSriastradh break; 447603b705cfSriastradh } 447703b705cfSriastradh 44789a906b70Schristos if (bo->map__cpu && bo->delta + MAP_PRESERVE_TIME > expire) { 447903b705cfSriastradh idle = false; 448003b705cfSriastradh list_move_tail(&bo->list, &preserve); 448103b705cfSriastradh } else { 448203b705cfSriastradh count++; 448303b705cfSriastradh size += bytes(bo); 448403b705cfSriastradh kgem_bo_free(kgem, bo); 448563ef14f0Smrg DBG(("%s: expiring handle=%d\n", 448603b705cfSriastradh __FUNCTION__, bo->handle)); 448703b705cfSriastradh } 448803b705cfSriastradh } 448963ef14f0Smrg list_splice_tail(&preserve, &kgem->inactive[i]); 449003b705cfSriastradh } 449103b705cfSriastradh 449203b705cfSriastradh#ifdef DEBUG_MEMORY 449303b705cfSriastradh { 449403b705cfSriastradh long inactive_size = 0; 449503b705cfSriastradh int inactive_count = 0; 449603b705cfSriastradh for (i = 0; i < ARRAY_SIZE(kgem->inactive); i++) 449703b705cfSriastradh 
list_for_each_entry(bo, &kgem->inactive[i], list) 449803b705cfSriastradh inactive_count++, inactive_size += bytes(bo); 44999a906b70Schristos DBG(("%s: still allocated %d bo, %ld bytes, in inactive cache\n", 45009a906b70Schristos __FUNCTION__, inactive_count, inactive_size)); 450103b705cfSriastradh } 450203b705cfSriastradh#endif 450303b705cfSriastradh 450403b705cfSriastradh DBG(("%s: expired %d objects, %d bytes, idle? %d\n", 450503b705cfSriastradh __FUNCTION__, count, size, idle)); 450603b705cfSriastradh 450703b705cfSriastradh kgem->need_expire = !idle; 45089a906b70Schristos return count; 450903b705cfSriastradh (void)count; 451003b705cfSriastradh (void)size; 451103b705cfSriastradh} 451203b705cfSriastradh 45139a906b70Schristosbool kgem_cleanup_cache(struct kgem *kgem) 451403b705cfSriastradh{ 451503b705cfSriastradh unsigned int i; 451603b705cfSriastradh int n; 451703b705cfSriastradh 451863ef14f0Smrg DBG(("%s\n", __FUNCTION__)); 451963ef14f0Smrg 452003b705cfSriastradh /* sync to the most recent request */ 452103b705cfSriastradh for (n = 0; n < ARRAY_SIZE(kgem->requests); n++) { 452203b705cfSriastradh if (!list_is_empty(&kgem->requests[n])) { 452303b705cfSriastradh struct kgem_request *rq; 452403b705cfSriastradh 452563ef14f0Smrg rq = list_last_entry(&kgem->requests[n], 452663ef14f0Smrg struct kgem_request, 452763ef14f0Smrg list); 452803b705cfSriastradh 452903b705cfSriastradh DBG(("%s: sync on cleanup\n", __FUNCTION__)); 453063ef14f0Smrg assert(rq->ring == n); 453163ef14f0Smrg assert(rq->bo); 453263ef14f0Smrg assert(RQ(rq->bo->rq) == rq); 453363ef14f0Smrg kgem_bo_wait(kgem, rq->bo); 453403b705cfSriastradh } 453563ef14f0Smrg assert(list_is_empty(&kgem->requests[n])); 453603b705cfSriastradh } 453703b705cfSriastradh 453803b705cfSriastradh kgem_retire(kgem); 453903b705cfSriastradh kgem_cleanup(kgem); 454003b705cfSriastradh 454163ef14f0Smrg DBG(("%s: need_expire?=%d\n", __FUNCTION__, kgem->need_expire)); 45429a906b70Schristos if (!kgem->need_expire) 45439a906b70Schristos 
return false; 45449a906b70Schristos 454503b705cfSriastradh for (i = 0; i < ARRAY_SIZE(kgem->inactive); i++) { 454603b705cfSriastradh while (!list_is_empty(&kgem->inactive[i])) 454703b705cfSriastradh kgem_bo_free(kgem, 454803b705cfSriastradh list_last_entry(&kgem->inactive[i], 454903b705cfSriastradh struct kgem_bo, list)); 455003b705cfSriastradh } 455103b705cfSriastradh 455203b705cfSriastradh kgem_clean_large_cache(kgem); 455303b705cfSriastradh kgem_clean_scanout_cache(kgem); 455403b705cfSriastradh 455503b705cfSriastradh while (!list_is_empty(&kgem->snoop)) 455603b705cfSriastradh kgem_bo_free(kgem, 455703b705cfSriastradh list_last_entry(&kgem->snoop, 455803b705cfSriastradh struct kgem_bo, list)); 455903b705cfSriastradh 456003b705cfSriastradh while (__kgem_freed_bo) { 456103b705cfSriastradh struct kgem_bo *bo = __kgem_freed_bo; 456203b705cfSriastradh __kgem_freed_bo = *(struct kgem_bo **)bo; 456303b705cfSriastradh free(bo); 456403b705cfSriastradh } 456503b705cfSriastradh 456603b705cfSriastradh kgem->need_purge = false; 456703b705cfSriastradh kgem->need_expire = false; 456863ef14f0Smrg 456963ef14f0Smrg DBG(("%s: complete\n", __FUNCTION__)); 45709a906b70Schristos return true; 457103b705cfSriastradh} 457203b705cfSriastradh 457303b705cfSriastradhstatic struct kgem_bo * 457403b705cfSriastradhsearch_linear_cache(struct kgem *kgem, unsigned int num_pages, unsigned flags) 457503b705cfSriastradh{ 457603b705cfSriastradh struct kgem_bo *bo, *first = NULL; 457703b705cfSriastradh bool use_active = (flags & CREATE_INACTIVE) == 0; 457803b705cfSriastradh struct list *cache; 457903b705cfSriastradh 458003b705cfSriastradh DBG(("%s: num_pages=%d, flags=%x, use_active? 
%d, use_large=%d [max=%d]\n", 458103b705cfSriastradh __FUNCTION__, num_pages, flags, use_active, 458203b705cfSriastradh num_pages >= MAX_CACHE_SIZE / PAGE_SIZE, 458303b705cfSriastradh MAX_CACHE_SIZE / PAGE_SIZE)); 458403b705cfSriastradh 458503b705cfSriastradh assert(num_pages); 458603b705cfSriastradh 458703b705cfSriastradh if (num_pages >= MAX_CACHE_SIZE / PAGE_SIZE) { 458803b705cfSriastradh DBG(("%s: searching large buffers\n", __FUNCTION__)); 458903b705cfSriastradhretry_large: 459003b705cfSriastradh cache = use_active ? &kgem->large : &kgem->large_inactive; 459103b705cfSriastradh list_for_each_entry_safe(bo, first, cache, list) { 459203b705cfSriastradh assert(bo->refcnt == 0); 459303b705cfSriastradh assert(bo->reusable); 459403b705cfSriastradh assert(!bo->scanout); 459503b705cfSriastradh 459603b705cfSriastradh if (num_pages > num_pages(bo)) 459703b705cfSriastradh goto discard; 459803b705cfSriastradh 459903b705cfSriastradh if (bo->tiling != I915_TILING_NONE) { 460063ef14f0Smrg if (use_active && kgem->gen < 040) 460103b705cfSriastradh goto discard; 460203b705cfSriastradh 460363ef14f0Smrg if (!kgem_set_tiling(kgem, bo, 460403b705cfSriastradh I915_TILING_NONE, 0)) 460503b705cfSriastradh goto discard; 460603b705cfSriastradh } 460763ef14f0Smrg assert(bo->tiling == I915_TILING_NONE); 460863ef14f0Smrg bo->pitch = 0; 460903b705cfSriastradh 461003b705cfSriastradh if (bo->purged && !kgem_bo_clear_purgeable(kgem, bo)) 461103b705cfSriastradh goto discard; 461203b705cfSriastradh 461303b705cfSriastradh list_del(&bo->list); 46149a906b70Schristos if (RQ(bo->rq) == (void *)kgem) { 46159a906b70Schristos assert(bo->exec == NULL); 461603b705cfSriastradh list_del(&bo->request); 46179a906b70Schristos } 461803b705cfSriastradh 461903b705cfSriastradh bo->delta = 0; 462003b705cfSriastradh assert_tiling(kgem, bo); 462103b705cfSriastradh return bo; 462203b705cfSriastradh 462303b705cfSriastradhdiscard: 462403b705cfSriastradh if (!use_active) 462503b705cfSriastradh kgem_bo_free(kgem, bo); 
462603b705cfSriastradh } 462703b705cfSriastradh 462803b705cfSriastradh if (use_active) { 462903b705cfSriastradh use_active = false; 463003b705cfSriastradh goto retry_large; 463103b705cfSriastradh } 463203b705cfSriastradh 463303b705cfSriastradh if (__kgem_throttle_retire(kgem, flags)) 463403b705cfSriastradh goto retry_large; 463503b705cfSriastradh 463603b705cfSriastradh return NULL; 463703b705cfSriastradh } 463803b705cfSriastradh 463903b705cfSriastradh if (!use_active && list_is_empty(inactive(kgem, num_pages))) { 464003b705cfSriastradh DBG(("%s: inactive and cache bucket empty\n", 464103b705cfSriastradh __FUNCTION__)); 464203b705cfSriastradh 464303b705cfSriastradh if (flags & CREATE_NO_RETIRE) { 464403b705cfSriastradh DBG(("%s: can not retire\n", __FUNCTION__)); 464503b705cfSriastradh return NULL; 464603b705cfSriastradh } 464703b705cfSriastradh 464803b705cfSriastradh if (list_is_empty(active(kgem, num_pages, I915_TILING_NONE))) { 464903b705cfSriastradh DBG(("%s: active cache bucket empty\n", __FUNCTION__)); 465003b705cfSriastradh return NULL; 465103b705cfSriastradh } 465203b705cfSriastradh 465303b705cfSriastradh if (!__kgem_throttle_retire(kgem, flags)) { 465403b705cfSriastradh DBG(("%s: nothing retired\n", __FUNCTION__)); 465503b705cfSriastradh return NULL; 465603b705cfSriastradh } 465703b705cfSriastradh 465803b705cfSriastradh if (list_is_empty(inactive(kgem, num_pages))) { 465903b705cfSriastradh DBG(("%s: active cache bucket still empty after retire\n", 466003b705cfSriastradh __FUNCTION__)); 466103b705cfSriastradh return NULL; 466203b705cfSriastradh } 466303b705cfSriastradh } 466403b705cfSriastradh 466503b705cfSriastradh if (!use_active && flags & (CREATE_CPU_MAP | CREATE_GTT_MAP)) { 466603b705cfSriastradh int for_cpu = !!(flags & CREATE_CPU_MAP); 466703b705cfSriastradh DBG(("%s: searching for inactive %s map\n", 466803b705cfSriastradh __FUNCTION__, for_cpu ? 
"cpu" : "gtt")); 466903b705cfSriastradh cache = &kgem->vma[for_cpu].inactive[cache_bucket(num_pages)]; 467003b705cfSriastradh list_for_each_entry(bo, cache, vma) { 4671813957e3Ssnj assert(for_cpu ? !!bo->map__cpu : (bo->map__gtt || bo->map__wc)); 467203b705cfSriastradh assert(bucket(bo) == cache_bucket(num_pages)); 467303b705cfSriastradh assert(bo->proxy == NULL); 467403b705cfSriastradh assert(bo->rq == NULL); 467503b705cfSriastradh assert(bo->exec == NULL); 467603b705cfSriastradh assert(!bo->scanout); 467703b705cfSriastradh 467803b705cfSriastradh if (num_pages > num_pages(bo)) { 467903b705cfSriastradh DBG(("inactive too small: %d < %d\n", 468003b705cfSriastradh num_pages(bo), num_pages)); 468103b705cfSriastradh continue; 468203b705cfSriastradh } 468303b705cfSriastradh 468403b705cfSriastradh if (bo->purged && !kgem_bo_clear_purgeable(kgem, bo)) { 468503b705cfSriastradh kgem_bo_free(kgem, bo); 468603b705cfSriastradh break; 468703b705cfSriastradh } 468803b705cfSriastradh 468963ef14f0Smrg if (!kgem_set_tiling(kgem, bo, I915_TILING_NONE, 0)) { 469063ef14f0Smrg kgem_bo_free(kgem, bo); 469163ef14f0Smrg break; 469263ef14f0Smrg } 469303b705cfSriastradh 469403b705cfSriastradh kgem_bo_remove_from_inactive(kgem, bo); 46959a906b70Schristos assert(list_is_empty(&bo->vma)); 46969a906b70Schristos assert(list_is_empty(&bo->list)); 469703b705cfSriastradh 469863ef14f0Smrg assert(bo->tiling == I915_TILING_NONE); 469963ef14f0Smrg assert(bo->pitch == 0); 470003b705cfSriastradh bo->delta = 0; 470103b705cfSriastradh DBG((" %s: found handle=%d (num_pages=%d) in linear vma cache\n", 470203b705cfSriastradh __FUNCTION__, bo->handle, num_pages(bo))); 470303b705cfSriastradh assert(use_active || bo->domain != DOMAIN_GPU); 470403b705cfSriastradh assert(!bo->needs_flush); 470503b705cfSriastradh assert_tiling(kgem, bo); 470603b705cfSriastradh ASSERT_MAYBE_IDLE(kgem, bo->handle, !use_active); 470703b705cfSriastradh return bo; 470803b705cfSriastradh } 470903b705cfSriastradh 471003b705cfSriastradh if 
(flags & CREATE_EXACT) 471103b705cfSriastradh return NULL; 471203b705cfSriastradh 471303b705cfSriastradh if (flags & CREATE_CPU_MAP && !kgem->has_llc) 471403b705cfSriastradh return NULL; 471503b705cfSriastradh } 471603b705cfSriastradh 471703b705cfSriastradh cache = use_active ? active(kgem, num_pages, I915_TILING_NONE) : inactive(kgem, num_pages); 471803b705cfSriastradh list_for_each_entry(bo, cache, list) { 471903b705cfSriastradh assert(bo->refcnt == 0); 472003b705cfSriastradh assert(bo->reusable); 472103b705cfSriastradh assert(!!bo->rq == !!use_active); 472203b705cfSriastradh assert(bo->proxy == NULL); 472303b705cfSriastradh assert(!bo->scanout); 472403b705cfSriastradh 472503b705cfSriastradh if (num_pages > num_pages(bo)) 472603b705cfSriastradh continue; 472703b705cfSriastradh 472803b705cfSriastradh if (use_active && 472903b705cfSriastradh kgem->gen <= 040 && 473003b705cfSriastradh bo->tiling != I915_TILING_NONE) 473103b705cfSriastradh continue; 473203b705cfSriastradh 473303b705cfSriastradh if (bo->purged && !kgem_bo_clear_purgeable(kgem, bo)) { 473403b705cfSriastradh kgem_bo_free(kgem, bo); 473503b705cfSriastradh break; 473603b705cfSriastradh } 473703b705cfSriastradh 473803b705cfSriastradh if (I915_TILING_NONE != bo->tiling) { 473903b705cfSriastradh if (flags & (CREATE_CPU_MAP | CREATE_GTT_MAP)) 474003b705cfSriastradh continue; 474103b705cfSriastradh 474203b705cfSriastradh if (first) 474303b705cfSriastradh continue; 474403b705cfSriastradh 474563ef14f0Smrg if (!kgem_set_tiling(kgem, bo, I915_TILING_NONE, 0)) 474603b705cfSriastradh continue; 474703b705cfSriastradh } 474863ef14f0Smrg assert(bo->tiling == I915_TILING_NONE); 474963ef14f0Smrg bo->pitch = 0; 475003b705cfSriastradh 4751813957e3Ssnj if (bo->map__gtt || bo->map__wc || bo->map__cpu) { 475203b705cfSriastradh if (flags & (CREATE_CPU_MAP | CREATE_GTT_MAP)) { 475303b705cfSriastradh int for_cpu = !!(flags & CREATE_CPU_MAP); 4754813957e3Ssnj if (for_cpu ? 
!!bo->map__cpu : (bo->map__gtt || bo->map__wc)){ 475503b705cfSriastradh if (first != NULL) 475603b705cfSriastradh break; 475703b705cfSriastradh 475803b705cfSriastradh first = bo; 475903b705cfSriastradh continue; 476003b705cfSriastradh } 476103b705cfSriastradh } else { 476203b705cfSriastradh if (first != NULL) 476303b705cfSriastradh break; 476403b705cfSriastradh 476503b705cfSriastradh first = bo; 476603b705cfSriastradh continue; 476703b705cfSriastradh } 476803b705cfSriastradh } else { 47699a906b70Schristos if (flags & CREATE_GTT_MAP && !kgem_bo_can_map(kgem, bo)) 47709a906b70Schristos continue; 47719a906b70Schristos 477203b705cfSriastradh if (flags & (CREATE_CPU_MAP | CREATE_GTT_MAP)) { 477303b705cfSriastradh if (first != NULL) 477403b705cfSriastradh break; 477503b705cfSriastradh 477603b705cfSriastradh first = bo; 477703b705cfSriastradh continue; 477803b705cfSriastradh } 477903b705cfSriastradh } 478003b705cfSriastradh 478103b705cfSriastradh if (use_active) 478203b705cfSriastradh kgem_bo_remove_from_active(kgem, bo); 478303b705cfSriastradh else 478403b705cfSriastradh kgem_bo_remove_from_inactive(kgem, bo); 478503b705cfSriastradh 478603b705cfSriastradh assert(bo->tiling == I915_TILING_NONE); 478763ef14f0Smrg assert(bo->pitch == 0); 478803b705cfSriastradh bo->delta = 0; 478903b705cfSriastradh DBG((" %s: found handle=%d (num_pages=%d) in linear %s cache\n", 479003b705cfSriastradh __FUNCTION__, bo->handle, num_pages(bo), 479103b705cfSriastradh use_active ? 
"active" : "inactive")); 479203b705cfSriastradh assert(list_is_empty(&bo->list)); 47939a906b70Schristos assert(list_is_empty(&bo->vma)); 479403b705cfSriastradh assert(use_active || bo->domain != DOMAIN_GPU); 479503b705cfSriastradh assert(!bo->needs_flush || use_active); 479603b705cfSriastradh assert_tiling(kgem, bo); 479703b705cfSriastradh ASSERT_MAYBE_IDLE(kgem, bo->handle, !use_active); 479803b705cfSriastradh return bo; 479903b705cfSriastradh } 480003b705cfSriastradh 480103b705cfSriastradh if (first) { 480203b705cfSriastradh assert(first->tiling == I915_TILING_NONE); 480303b705cfSriastradh 480403b705cfSriastradh if (use_active) 480503b705cfSriastradh kgem_bo_remove_from_active(kgem, first); 480603b705cfSriastradh else 480703b705cfSriastradh kgem_bo_remove_from_inactive(kgem, first); 480803b705cfSriastradh 480903b705cfSriastradh first->pitch = 0; 481003b705cfSriastradh first->delta = 0; 481103b705cfSriastradh DBG((" %s: found handle=%d (near-miss) (num_pages=%d) in linear %s cache\n", 481203b705cfSriastradh __FUNCTION__, first->handle, num_pages(first), 481303b705cfSriastradh use_active ? 
"active" : "inactive")); 481403b705cfSriastradh assert(list_is_empty(&first->list)); 48159a906b70Schristos assert(list_is_empty(&first->vma)); 481603b705cfSriastradh assert(use_active || first->domain != DOMAIN_GPU); 481703b705cfSriastradh assert(!first->needs_flush || use_active); 481803b705cfSriastradh ASSERT_MAYBE_IDLE(kgem, first->handle, !use_active); 481903b705cfSriastradh return first; 482003b705cfSriastradh } 482103b705cfSriastradh 482203b705cfSriastradh return NULL; 482303b705cfSriastradh} 482403b705cfSriastradh 482503b705cfSriastradhstruct kgem_bo *kgem_create_for_name(struct kgem *kgem, uint32_t name) 482603b705cfSriastradh{ 482703b705cfSriastradh struct drm_gem_open open_arg; 48289a906b70Schristos struct drm_i915_gem_get_tiling tiling; 482903b705cfSriastradh struct kgem_bo *bo; 483003b705cfSriastradh 483103b705cfSriastradh DBG(("%s(name=%d)\n", __FUNCTION__, name)); 483203b705cfSriastradh 483303b705cfSriastradh VG_CLEAR(open_arg); 483403b705cfSriastradh open_arg.name = name; 48359a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_GEM_OPEN, &open_arg)) 483603b705cfSriastradh return NULL; 483703b705cfSriastradh 483803b705cfSriastradh DBG(("%s: new handle=%d\n", __FUNCTION__, open_arg.handle)); 48399a906b70Schristos 48409a906b70Schristos VG_CLEAR(tiling); 48419a906b70Schristos tiling.handle = open_arg.handle; 48429a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_GET_TILING, &tiling)) { 48439a906b70Schristos DBG(("%s(name=%d) get-tiling failed, ret=%d\n", __FUNCTION__, name, errno)); 48449a906b70Schristos gem_close(kgem->fd, open_arg.handle); 48459a906b70Schristos return NULL; 48469a906b70Schristos } 48479a906b70Schristos 48489a906b70Schristos DBG(("%s: handle=%d, tiling=%d\n", __FUNCTION__, tiling.handle, tiling.tiling_mode)); 48499a906b70Schristos 485003b705cfSriastradh bo = __kgem_bo_alloc(open_arg.handle, open_arg.size / PAGE_SIZE); 485103b705cfSriastradh if (bo == NULL) { 485203b705cfSriastradh gem_close(kgem->fd, open_arg.handle); 
485303b705cfSriastradh return NULL; 485403b705cfSriastradh } 485503b705cfSriastradh 48569a906b70Schristos bo->unique_id = kgem_get_unique_id(kgem); 48579a906b70Schristos bo->tiling = tiling.tiling_mode; 48589a906b70Schristos bo->prime = true; 485963ef14f0Smrg bo->reusable = false; 486063ef14f0Smrg kgem_bo_unclean(kgem, bo); 486103b705cfSriastradh 486203b705cfSriastradh debug_alloc__bo(kgem, bo); 486303b705cfSriastradh return bo; 486403b705cfSriastradh} 486503b705cfSriastradh 486603b705cfSriastradhstruct kgem_bo *kgem_create_for_prime(struct kgem *kgem, int name, uint32_t size) 486703b705cfSriastradh{ 486803b705cfSriastradh#ifdef DRM_IOCTL_PRIME_FD_TO_HANDLE 486903b705cfSriastradh struct drm_prime_handle args; 487003b705cfSriastradh struct drm_i915_gem_get_tiling tiling; 48719a906b70Schristos struct local_i915_gem_caching caching; 487203b705cfSriastradh struct kgem_bo *bo; 48739a906b70Schristos off_t seek; 487403b705cfSriastradh 487503b705cfSriastradh DBG(("%s(name=%d)\n", __FUNCTION__, name)); 487603b705cfSriastradh 487703b705cfSriastradh VG_CLEAR(args); 487803b705cfSriastradh args.fd = name; 487903b705cfSriastradh args.flags = 0; 48809a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_PRIME_FD_TO_HANDLE, &args)) { 48819a906b70Schristos DBG(("%s(name=%d) fd-to-handle failed, ret=%d\n", __FUNCTION__, name, errno)); 488203b705cfSriastradh return NULL; 48839a906b70Schristos } 488403b705cfSriastradh 488503b705cfSriastradh VG_CLEAR(tiling); 488603b705cfSriastradh tiling.handle = args.handle; 48879a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_GET_TILING, &tiling)) { 48889a906b70Schristos DBG(("%s(name=%d) get-tiling failed, ret=%d\n", __FUNCTION__, name, errno)); 488903b705cfSriastradh gem_close(kgem->fd, args.handle); 489003b705cfSriastradh return NULL; 489103b705cfSriastradh } 489203b705cfSriastradh 48939a906b70Schristos /* Query actual size, overriding specified if available */ 48949a906b70Schristos seek = lseek(args.fd, 0, SEEK_END); 48959a906b70Schristos 
DBG(("%s: estimated size=%ld, actual=%lld\n", 48969a906b70Schristos __FUNCTION__, (long)size, (long long)seek)); 48979a906b70Schristos if (seek != -1) { 48989a906b70Schristos if (size > seek) { 48999a906b70Schristos DBG(("%s(name=%d) estimated required size [%d] is larger than actual [%ld]\n", __FUNCTION__, name, size, (long)seek)); 49009a906b70Schristos gem_close(kgem->fd, args.handle); 49019a906b70Schristos return NULL; 49029a906b70Schristos } 49039a906b70Schristos size = seek; 49049a906b70Schristos } 49059a906b70Schristos 490603b705cfSriastradh DBG(("%s: new handle=%d, tiling=%d\n", __FUNCTION__, 490703b705cfSriastradh args.handle, tiling.tiling_mode)); 490803b705cfSriastradh bo = __kgem_bo_alloc(args.handle, NUM_PAGES(size)); 490903b705cfSriastradh if (bo == NULL) { 491003b705cfSriastradh gem_close(kgem->fd, args.handle); 491103b705cfSriastradh return NULL; 491203b705cfSriastradh } 491303b705cfSriastradh 49149a906b70Schristos bo->unique_id = kgem_get_unique_id(kgem); 491503b705cfSriastradh bo->tiling = tiling.tiling_mode; 491603b705cfSriastradh bo->reusable = false; 49179a906b70Schristos bo->prime = true; 49189a906b70Schristos bo->domain = DOMAIN_NONE; 49199a906b70Schristos 49209a906b70Schristos /* is this a special bo (e.g. scanout or CPU coherent)? 
*/ 49219a906b70Schristos 49229a906b70Schristos VG_CLEAR(caching); 49239a906b70Schristos caching.handle = args.handle; 49249a906b70Schristos caching.caching = kgem->has_llc; 49259a906b70Schristos (void)drmIoctl(kgem->fd, LOCAL_IOCTL_I915_GEM_GET_CACHING, &caching); 49269a906b70Schristos DBG(("%s: imported handle=%d has caching %d\n", __FUNCTION__, args.handle, caching.caching)); 49279a906b70Schristos switch (caching.caching) { 49289a906b70Schristos case 0: 49299a906b70Schristos if (kgem->has_llc) { 49309a906b70Schristos DBG(("%s: interpreting handle=%d as a foreign scanout\n", 49319a906b70Schristos __FUNCTION__, args.handle)); 49329a906b70Schristos bo->scanout = true; 49339a906b70Schristos } 49349a906b70Schristos break; 49359a906b70Schristos case 1: 49369a906b70Schristos if (!kgem->has_llc) { 49379a906b70Schristos DBG(("%s: interpreting handle=%d as a foreign snooped buffer\n", 49389a906b70Schristos __FUNCTION__, args.handle)); 49399a906b70Schristos bo->snoop = true; 49409a906b70Schristos if (bo->tiling) { 49419a906b70Schristos DBG(("%s: illegal snooped tiled buffer\n", __FUNCTION__)); 49429a906b70Schristos kgem_bo_free(kgem, bo); 49439a906b70Schristos return NULL; 49449a906b70Schristos } 49459a906b70Schristos } 49469a906b70Schristos break; 49479a906b70Schristos case 2: 49489a906b70Schristos DBG(("%s: interpreting handle=%d as a foreign scanout\n", 49499a906b70Schristos __FUNCTION__, args.handle)); 49509a906b70Schristos bo->scanout = true; 49519a906b70Schristos break; 49529a906b70Schristos } 495303b705cfSriastradh 495403b705cfSriastradh debug_alloc__bo(kgem, bo); 495503b705cfSriastradh return bo; 495603b705cfSriastradh#else 495703b705cfSriastradh return NULL; 495803b705cfSriastradh#endif 495903b705cfSriastradh} 496003b705cfSriastradh 496103b705cfSriastradhint kgem_bo_export_to_prime(struct kgem *kgem, struct kgem_bo *bo) 496203b705cfSriastradh{ 496303b705cfSriastradh#if defined(DRM_IOCTL_PRIME_HANDLE_TO_FD) && defined(O_CLOEXEC) 496403b705cfSriastradh struct 
drm_prime_handle args; 496503b705cfSriastradh 496663ef14f0Smrg assert(kgem_bo_is_fenced(kgem, bo)); 496763ef14f0Smrg 496803b705cfSriastradh VG_CLEAR(args); 496903b705cfSriastradh args.handle = bo->handle; 497003b705cfSriastradh args.flags = O_CLOEXEC; 497103b705cfSriastradh 49729a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_PRIME_HANDLE_TO_FD, &args)) 497303b705cfSriastradh return -1; 497403b705cfSriastradh 497503b705cfSriastradh bo->reusable = false; 497603b705cfSriastradh return args.fd; 497703b705cfSriastradh#else 497803b705cfSriastradh return -1; 497903b705cfSriastradh#endif 498003b705cfSriastradh} 498103b705cfSriastradh 498203b705cfSriastradhstruct kgem_bo *kgem_create_linear(struct kgem *kgem, int size, unsigned flags) 498303b705cfSriastradh{ 498403b705cfSriastradh struct kgem_bo *bo; 498503b705cfSriastradh uint32_t handle; 498603b705cfSriastradh 498703b705cfSriastradh DBG(("%s(%d)\n", __FUNCTION__, size)); 498803b705cfSriastradh assert(size); 498903b705cfSriastradh 499003b705cfSriastradh if (flags & CREATE_GTT_MAP && kgem->has_llc) { 499103b705cfSriastradh flags &= ~CREATE_GTT_MAP; 499203b705cfSriastradh flags |= CREATE_CPU_MAP; 499303b705cfSriastradh } 499403b705cfSriastradh 499503b705cfSriastradh size = NUM_PAGES(size); 4996813957e3Ssnj if ((flags & CREATE_UNCACHED) == 0) { 4997813957e3Ssnj bo = search_linear_cache(kgem, size, CREATE_INACTIVE | flags); 4998813957e3Ssnj if (bo) { 499963ef14f0Smrg assert(!bo->purged); 500063ef14f0Smrg assert(!bo->delta); 5001813957e3Ssnj assert(bo->domain != DOMAIN_GPU); 5002813957e3Ssnj ASSERT_IDLE(kgem, bo->handle); 5003813957e3Ssnj bo->refcnt = 1; 5004813957e3Ssnj return bo; 5005813957e3Ssnj } 500603b705cfSriastradh 5007813957e3Ssnj if (flags & CREATE_CACHED) 5008813957e3Ssnj return NULL; 5009813957e3Ssnj } 501003b705cfSriastradh 501103b705cfSriastradh handle = gem_create(kgem->fd, size); 501203b705cfSriastradh if (handle == 0) 501303b705cfSriastradh return NULL; 501403b705cfSriastradh 501503b705cfSriastradh DBG(("%s: 
new handle=%d, num_pages=%d\n", __FUNCTION__, handle, size)); 501603b705cfSriastradh bo = __kgem_bo_alloc(handle, size); 501703b705cfSriastradh if (bo == NULL) { 501803b705cfSriastradh gem_close(kgem->fd, handle); 501903b705cfSriastradh return NULL; 502003b705cfSriastradh } 502103b705cfSriastradh 502203b705cfSriastradh debug_alloc__bo(kgem, bo); 502303b705cfSriastradh return bo; 502403b705cfSriastradh} 502503b705cfSriastradh 502603b705cfSriastradhint kgem_choose_tiling(struct kgem *kgem, int tiling, int width, int height, int bpp) 502703b705cfSriastradh{ 502803b705cfSriastradh if (DBG_NO_TILING) 502903b705cfSriastradh return tiling < 0 ? tiling : I915_TILING_NONE; 503003b705cfSriastradh 503103b705cfSriastradh if (kgem->gen < 040) { 503203b705cfSriastradh if (tiling && width * bpp > 8192 * 8) { 503303b705cfSriastradh DBG(("%s: pitch too large for tliing [%d]\n", 503403b705cfSriastradh __FUNCTION__, width*bpp/8)); 503503b705cfSriastradh tiling = I915_TILING_NONE; 503603b705cfSriastradh goto done; 503703b705cfSriastradh } 503803b705cfSriastradh } else { 503903b705cfSriastradh if (width*bpp > (MAXSHORT-512) * 8) { 504003b705cfSriastradh if (tiling > 0) 504103b705cfSriastradh tiling = -tiling; 504203b705cfSriastradh else if (tiling == 0) 504303b705cfSriastradh tiling = -I915_TILING_X; 504403b705cfSriastradh DBG(("%s: large pitch [%d], forcing TILING [%d]\n", 504503b705cfSriastradh __FUNCTION__, width*bpp/8, tiling)); 504603b705cfSriastradh } else if (tiling && (width|height) > 8192) { 504703b705cfSriastradh DBG(("%s: large tiled buffer [%dx%d], forcing TILING_X\n", 504803b705cfSriastradh __FUNCTION__, width, height)); 504903b705cfSriastradh tiling = -I915_TILING_X; 505003b705cfSriastradh } 505103b705cfSriastradh 505203b705cfSriastradh /* fences limited to 128k (256k on ivb) */ 505303b705cfSriastradh assert(width * bpp <= 128 * 1024 * 8); 505403b705cfSriastradh } 505503b705cfSriastradh 505603b705cfSriastradh if (tiling < 0) 505703b705cfSriastradh return tiling; 
505803b705cfSriastradh 50599a906b70Schristos if (tiling == I915_TILING_Y && !kgem->can_render_y) 50609a906b70Schristos tiling = I915_TILING_X; 50619a906b70Schristos 506203b705cfSriastradh if (tiling && (height == 1 || width == 1)) { 506303b705cfSriastradh DBG(("%s: disabling tiling [%dx%d] for single row/col\n", 506403b705cfSriastradh __FUNCTION__,width, height)); 506503b705cfSriastradh tiling = I915_TILING_NONE; 506603b705cfSriastradh goto done; 506703b705cfSriastradh } 506803b705cfSriastradh if (tiling == I915_TILING_Y && height <= 16) { 506903b705cfSriastradh DBG(("%s: too short [%d] for TILING_Y\n", 507003b705cfSriastradh __FUNCTION__,height)); 507103b705cfSriastradh tiling = I915_TILING_X; 507203b705cfSriastradh } 507303b705cfSriastradh if (tiling && width * bpp > 8 * (4096 - 64)) { 507403b705cfSriastradh DBG(("%s: TLB miss between lines %dx%d (pitch=%d), forcing tiling %d\n", 507503b705cfSriastradh __FUNCTION__, 507603b705cfSriastradh width, height, width*bpp/8, 507703b705cfSriastradh tiling)); 507803b705cfSriastradh return -tiling; 507903b705cfSriastradh } 508003b705cfSriastradh if (tiling == I915_TILING_X && height < 4) { 508103b705cfSriastradh DBG(("%s: too short [%d] for TILING_X\n", 508203b705cfSriastradh __FUNCTION__, height)); 508303b705cfSriastradh tiling = I915_TILING_NONE; 508403b705cfSriastradh goto done; 508503b705cfSriastradh } 508603b705cfSriastradh 50879a906b70Schristos if (tiling == I915_TILING_X && width * bpp <= 8*512) { 508803b705cfSriastradh DBG(("%s: too thin [width %d, %d bpp] for TILING_X\n", 508903b705cfSriastradh __FUNCTION__, width, bpp)); 509003b705cfSriastradh tiling = I915_TILING_NONE; 509103b705cfSriastradh goto done; 509203b705cfSriastradh } 50939a906b70Schristos if (tiling == I915_TILING_Y && width * bpp < 8*128) { 509403b705cfSriastradh DBG(("%s: too thin [%d] for TILING_Y\n", 509503b705cfSriastradh __FUNCTION__, width)); 509603b705cfSriastradh tiling = I915_TILING_NONE; 509703b705cfSriastradh goto done; 509803b705cfSriastradh 
} 509903b705cfSriastradh 510003b705cfSriastradh if (tiling && ALIGN(height, 2) * ALIGN(width*bpp, 8*64) <= 4096 * 8) { 510103b705cfSriastradh DBG(("%s: too small [%d bytes] for TILING_%c\n", __FUNCTION__, 510203b705cfSriastradh ALIGN(height, 2) * ALIGN(width*bpp, 8*64) / 8, 510303b705cfSriastradh tiling == I915_TILING_X ? 'X' : 'Y')); 510403b705cfSriastradh tiling = I915_TILING_NONE; 510503b705cfSriastradh goto done; 510603b705cfSriastradh } 510703b705cfSriastradh 510803b705cfSriastradh if (tiling && width * bpp >= 8 * 4096 / 2) { 510903b705cfSriastradh DBG(("%s: TLB near-miss between lines %dx%d (pitch=%d), forcing tiling %d\n", 511003b705cfSriastradh __FUNCTION__, 511103b705cfSriastradh width, height, width*bpp/8, 511203b705cfSriastradh tiling)); 511303b705cfSriastradh return -tiling; 511403b705cfSriastradh } 511503b705cfSriastradh 511603b705cfSriastradhdone: 511703b705cfSriastradh DBG(("%s: %dx%d -> %d\n", __FUNCTION__, width, height, tiling)); 511803b705cfSriastradh return tiling; 511903b705cfSriastradh} 512003b705cfSriastradh 512103b705cfSriastradhstatic int bits_per_pixel(int depth) 512203b705cfSriastradh{ 512303b705cfSriastradh switch (depth) { 512403b705cfSriastradh case 8: return 8; 512503b705cfSriastradh case 15: 512603b705cfSriastradh case 16: return 16; 512703b705cfSriastradh case 24: 512803b705cfSriastradh case 30: 512903b705cfSriastradh case 32: return 32; 513003b705cfSriastradh default: return 0; 513103b705cfSriastradh } 513203b705cfSriastradh} 513303b705cfSriastradh 513403b705cfSriastradhunsigned kgem_can_create_2d(struct kgem *kgem, 513503b705cfSriastradh int width, int height, int depth) 513603b705cfSriastradh{ 513703b705cfSriastradh uint32_t pitch, size; 513803b705cfSriastradh unsigned flags = 0; 513903b705cfSriastradh int tiling; 514003b705cfSriastradh int bpp; 514103b705cfSriastradh 514203b705cfSriastradh DBG(("%s: %dx%d @ %d\n", __FUNCTION__, width, height, depth)); 514303b705cfSriastradh 514403b705cfSriastradh bpp = bits_per_pixel(depth); 
514503b705cfSriastradh if (bpp == 0) { 514603b705cfSriastradh DBG(("%s: unhandled depth %d\n", __FUNCTION__, depth)); 514703b705cfSriastradh return 0; 514803b705cfSriastradh } 514903b705cfSriastradh 515003b705cfSriastradh if (width > MAXSHORT || height > MAXSHORT) { 515103b705cfSriastradh DBG(("%s: unhandled size %dx%d\n", 515203b705cfSriastradh __FUNCTION__, width, height)); 515303b705cfSriastradh return 0; 515403b705cfSriastradh } 515503b705cfSriastradh 515603b705cfSriastradh size = kgem_surface_size(kgem, false, 0, 515703b705cfSriastradh width, height, bpp, 515803b705cfSriastradh I915_TILING_NONE, &pitch); 515903b705cfSriastradh DBG(("%s: untiled size=%d\n", __FUNCTION__, size)); 516003b705cfSriastradh if (size > 0) { 516103b705cfSriastradh if (size <= kgem->max_cpu_size) 516203b705cfSriastradh flags |= KGEM_CAN_CREATE_CPU; 51639a906b70Schristos if (size > 4096 && size <= kgem->max_gpu_size) 516403b705cfSriastradh flags |= KGEM_CAN_CREATE_GPU; 5165813957e3Ssnj if (size <= PAGE_SIZE*kgem->aperture_mappable/4 || kgem->has_wc_mmap) 516603b705cfSriastradh flags |= KGEM_CAN_CREATE_GTT; 516703b705cfSriastradh if (size > kgem->large_object_size) 516803b705cfSriastradh flags |= KGEM_CAN_CREATE_LARGE; 516903b705cfSriastradh if (size > kgem->max_object_size) { 517003b705cfSriastradh DBG(("%s: too large (untiled) %d > %d\n", 517103b705cfSriastradh __FUNCTION__, size, kgem->max_object_size)); 517203b705cfSriastradh return 0; 517303b705cfSriastradh } 517403b705cfSriastradh } 517503b705cfSriastradh 517603b705cfSriastradh tiling = kgem_choose_tiling(kgem, I915_TILING_X, 517703b705cfSriastradh width, height, bpp); 517803b705cfSriastradh if (tiling != I915_TILING_NONE) { 517903b705cfSriastradh size = kgem_surface_size(kgem, false, 0, 518003b705cfSriastradh width, height, bpp, tiling, 518103b705cfSriastradh &pitch); 518203b705cfSriastradh DBG(("%s: tiled[%d] size=%d\n", __FUNCTION__, tiling, size)); 518303b705cfSriastradh if (size > 0 && size <= kgem->max_gpu_size) 
51849a906b70Schristos flags |= KGEM_CAN_CREATE_GPU | KGEM_CAN_CREATE_TILED; 51859a906b70Schristos if (size > 0 && size <= PAGE_SIZE*kgem->aperture_mappable/4) 518603b705cfSriastradh flags |= KGEM_CAN_CREATE_GTT; 51879a906b70Schristos if (size > PAGE_SIZE*kgem->aperture_mappable/4) 51889a906b70Schristos flags &= ~KGEM_CAN_CREATE_GTT; 518903b705cfSriastradh if (size > kgem->large_object_size) 519003b705cfSriastradh flags |= KGEM_CAN_CREATE_LARGE; 519103b705cfSriastradh if (size > kgem->max_object_size) { 519203b705cfSriastradh DBG(("%s: too large (tiled) %d > %d\n", 519303b705cfSriastradh __FUNCTION__, size, kgem->max_object_size)); 519403b705cfSriastradh return 0; 519503b705cfSriastradh } 51969a906b70Schristos if (kgem->gen < 040) { 51979a906b70Schristos int fence_size = 1024 * 1024; 51989a906b70Schristos while (fence_size < size) 51999a906b70Schristos fence_size <<= 1; 52009a906b70Schristos if (fence_size > kgem->max_gpu_size) 52019a906b70Schristos flags &= ~KGEM_CAN_CREATE_GPU | KGEM_CAN_CREATE_TILED; 52029a906b70Schristos if (fence_size > PAGE_SIZE*kgem->aperture_fenceable/4) 52039a906b70Schristos flags &= ~KGEM_CAN_CREATE_GTT; 52049a906b70Schristos } 520503b705cfSriastradh } 520603b705cfSriastradh 520703b705cfSriastradh return flags; 520803b705cfSriastradh} 520903b705cfSriastradh 521003b705cfSriastradhinline int kgem_bo_fenced_size(struct kgem *kgem, struct kgem_bo *bo) 521103b705cfSriastradh{ 521203b705cfSriastradh unsigned int size; 521303b705cfSriastradh 521403b705cfSriastradh assert(bo->tiling); 521503b705cfSriastradh assert_tiling(kgem, bo); 521603b705cfSriastradh assert(kgem->gen < 040); 521703b705cfSriastradh 521803b705cfSriastradh if (kgem->gen < 030) 52199a906b70Schristos size = 512 * 1024 / PAGE_SIZE; 522003b705cfSriastradh else 52219a906b70Schristos size = 1024 * 1024 / PAGE_SIZE; 52229a906b70Schristos while (size < num_pages(bo)) 52239a906b70Schristos size <<= 1; 522403b705cfSriastradh 522503b705cfSriastradh return size; 522603b705cfSriastradh} 
522703b705cfSriastradh 522803b705cfSriastradhstatic struct kgem_bo * 522903b705cfSriastradh__kgem_bo_create_as_display(struct kgem *kgem, int size, int tiling, int pitch) 523003b705cfSriastradh{ 523103b705cfSriastradh struct local_i915_gem_create2 args; 523203b705cfSriastradh struct kgem_bo *bo; 523303b705cfSriastradh 523403b705cfSriastradh if (!kgem->has_create2) 523503b705cfSriastradh return NULL; 523603b705cfSriastradh 523703b705cfSriastradh memset(&args, 0, sizeof(args)); 523803b705cfSriastradh args.size = size * PAGE_SIZE; 523903b705cfSriastradh args.placement = LOCAL_I915_CREATE_PLACEMENT_STOLEN; 524003b705cfSriastradh args.caching = DISPLAY; 524103b705cfSriastradh args.tiling_mode = tiling; 524203b705cfSriastradh args.stride = pitch; 524303b705cfSriastradh 52449a906b70Schristos if (do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_CREATE2, &args)) { 524503b705cfSriastradh args.placement = LOCAL_I915_CREATE_PLACEMENT_SYSTEM; 52469a906b70Schristos if (do_ioctl(kgem->fd, LOCAL_IOCTL_I915_GEM_CREATE2, &args)) 524703b705cfSriastradh return NULL; 524803b705cfSriastradh } 524903b705cfSriastradh 525003b705cfSriastradh bo = __kgem_bo_alloc(args.handle, size); 525103b705cfSriastradh if (bo == NULL) { 525203b705cfSriastradh gem_close(kgem->fd, args.handle); 525303b705cfSriastradh return NULL; 525403b705cfSriastradh } 525503b705cfSriastradh 525603b705cfSriastradh bo->unique_id = kgem_get_unique_id(kgem); 525703b705cfSriastradh bo->tiling = tiling; 525803b705cfSriastradh bo->pitch = pitch; 525903b705cfSriastradh if (args.placement == LOCAL_I915_CREATE_PLACEMENT_STOLEN) { 526003b705cfSriastradh bo->purged = true; /* for asserts against CPU access */ 526103b705cfSriastradh } 526203b705cfSriastradh bo->reusable = false; /* so that unclaimed scanouts are freed */ 526303b705cfSriastradh bo->domain = DOMAIN_NONE; 526403b705cfSriastradh 526503b705cfSriastradh if (__kgem_busy(kgem, bo->handle)) { 52669a906b70Schristos assert(bo->exec == NULL); 526703b705cfSriastradh list_add(&bo->request, 
&kgem->flushing); 526803b705cfSriastradh bo->rq = (void *)kgem; 52699a906b70Schristos kgem->need_retire = true; 527003b705cfSriastradh } 527103b705cfSriastradh 527203b705cfSriastradh assert_tiling(kgem, bo); 527303b705cfSriastradh debug_alloc__bo(kgem, bo); 527403b705cfSriastradh 527503b705cfSriastradh return bo; 527603b705cfSriastradh} 527703b705cfSriastradh 52789a906b70Schristosstatic void __kgem_bo_make_scanout(struct kgem *kgem, 52799a906b70Schristos struct kgem_bo *bo, 52809a906b70Schristos int width, int height) 52819a906b70Schristos{ 528263ef14f0Smrg ScrnInfoPtr scrn = __to_sna(kgem)->scrn; 52839a906b70Schristos struct drm_mode_fb_cmd arg; 52849a906b70Schristos 52859a906b70Schristos assert(bo->proxy == NULL); 52869a906b70Schristos 52879a906b70Schristos if (!scrn->vtSema) 52889a906b70Schristos return; 52899a906b70Schristos 52909a906b70Schristos DBG(("%s: create fb %dx%d@%d/%d\n", 52919a906b70Schristos __FUNCTION__, width, height, scrn->depth, scrn->bitsPerPixel)); 52929a906b70Schristos 52939a906b70Schristos VG_CLEAR(arg); 52949a906b70Schristos arg.width = width; 52959a906b70Schristos arg.height = height; 52969a906b70Schristos arg.pitch = bo->pitch; 52979a906b70Schristos arg.bpp = scrn->bitsPerPixel; 52989a906b70Schristos arg.depth = scrn->depth; 52999a906b70Schristos arg.handle = bo->handle; 53009a906b70Schristos 53019a906b70Schristos /* First move the scanout out of cached memory */ 53029a906b70Schristos if (kgem->has_llc) { 53039a906b70Schristos if (!gem_set_caching(kgem->fd, bo->handle, DISPLAY) && 53049a906b70Schristos !gem_set_caching(kgem->fd, bo->handle, UNCACHED)) 53059a906b70Schristos return; 53069a906b70Schristos } 53079a906b70Schristos 53089a906b70Schristos bo->scanout = true; 53099a906b70Schristos 53109a906b70Schristos /* Then pre-emptively move the object into the mappable 53119a906b70Schristos * portion to avoid rebinding later when busy. 
53129a906b70Schristos */ 53139a906b70Schristos if (bo->map__gtt == NULL) 53149a906b70Schristos bo->map__gtt = __kgem_bo_map__gtt(kgem, bo); 53159a906b70Schristos if (bo->map__gtt) { 5316813957e3Ssnj if (sigtrap_get() == 0) { 5317813957e3Ssnj *(uint32_t *)bo->map__gtt = 0; 5318813957e3Ssnj sigtrap_put(); 5319813957e3Ssnj } 53209a906b70Schristos bo->domain = DOMAIN_GTT; 53219a906b70Schristos } 53229a906b70Schristos 53239a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_MODE_ADDFB, &arg) == 0) { 53249a906b70Schristos DBG(("%s: attached fb=%d to handle=%d\n", 53259a906b70Schristos __FUNCTION__, arg.fb_id, arg.handle)); 53269a906b70Schristos bo->delta = arg.fb_id; 53279a906b70Schristos } 53289a906b70Schristos} 53299a906b70Schristos 533063ef14f0Smrgstatic bool tiling_changed(struct kgem_bo *bo, int tiling, int pitch) 533163ef14f0Smrg{ 533263ef14f0Smrg if (tiling != bo->tiling) 533363ef14f0Smrg return true; 533463ef14f0Smrg 533563ef14f0Smrg return tiling != I915_TILING_NONE && pitch != bo->pitch; 533663ef14f0Smrg} 533763ef14f0Smrg 533863ef14f0Smrgstatic void set_gpu_tiling(struct kgem *kgem, 533963ef14f0Smrg struct kgem_bo *bo, 534063ef14f0Smrg int tiling, int pitch) 534163ef14f0Smrg{ 534263ef14f0Smrg DBG(("%s: handle=%d, tiling=%d, pitch=%d\n", 534363ef14f0Smrg __FUNCTION__, bo->handle, tiling, pitch)); 534463ef14f0Smrg 534563ef14f0Smrg if (tiling_changed(bo, tiling, pitch) && bo->map__gtt) { 534663ef14f0Smrg if (!list_is_empty(&bo->vma)) { 534763ef14f0Smrg list_del(&bo->vma); 534863ef14f0Smrg kgem->vma[0].count--; 534963ef14f0Smrg } 535063ef14f0Smrg munmap(bo->map__gtt, bytes(bo)); 535163ef14f0Smrg bo->map__gtt = NULL; 535263ef14f0Smrg } 535363ef14f0Smrg 535463ef14f0Smrg bo->tiling = tiling; 535563ef14f0Smrg bo->pitch = pitch; 535663ef14f0Smrg} 535763ef14f0Smrg 535863ef14f0Smrgbool kgem_bo_is_fenced(struct kgem *kgem, struct kgem_bo *bo) 535963ef14f0Smrg{ 536063ef14f0Smrg struct drm_i915_gem_get_tiling tiling; 536163ef14f0Smrg 536263ef14f0Smrg assert(kgem); 
536363ef14f0Smrg assert(bo); 536463ef14f0Smrg 536563ef14f0Smrg VG_CLEAR(tiling); 536663ef14f0Smrg tiling.handle = bo->handle; 536763ef14f0Smrg tiling.tiling_mode = bo->tiling; 536863ef14f0Smrg (void)do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_GET_TILING, &tiling); 536963ef14f0Smrg return tiling.tiling_mode == bo->tiling; /* assume pitch is fine! */ 537063ef14f0Smrg} 537163ef14f0Smrg 537203b705cfSriastradhstruct kgem_bo *kgem_create_2d(struct kgem *kgem, 537303b705cfSriastradh int width, 537403b705cfSriastradh int height, 537503b705cfSriastradh int bpp, 537603b705cfSriastradh int tiling, 537703b705cfSriastradh uint32_t flags) 537803b705cfSriastradh{ 537903b705cfSriastradh struct list *cache; 538003b705cfSriastradh struct kgem_bo *bo; 538103b705cfSriastradh uint32_t pitch, tiled_height, size; 538203b705cfSriastradh uint32_t handle; 538303b705cfSriastradh int i, bucket, retry; 538403b705cfSriastradh bool exact = flags & (CREATE_EXACT | CREATE_SCANOUT); 538503b705cfSriastradh 538603b705cfSriastradh if (tiling < 0) 538703b705cfSriastradh exact = true, tiling = -tiling; 538803b705cfSriastradh 538903b705cfSriastradh DBG(("%s(%dx%d, bpp=%d, tiling=%d, exact=%d, inactive=%d, cpu-mapping=%d, gtt-mapping=%d, scanout?=%d, prime?=%d, temp?=%d)\n", __FUNCTION__, 539003b705cfSriastradh width, height, bpp, tiling, exact, 539103b705cfSriastradh !!(flags & CREATE_INACTIVE), 539203b705cfSriastradh !!(flags & CREATE_CPU_MAP), 539303b705cfSriastradh !!(flags & CREATE_GTT_MAP), 539403b705cfSriastradh !!(flags & CREATE_SCANOUT), 539503b705cfSriastradh !!(flags & CREATE_PRIME), 539603b705cfSriastradh !!(flags & CREATE_TEMPORARY))); 539703b705cfSriastradh 539803b705cfSriastradh size = kgem_surface_size(kgem, kgem->has_relaxed_fencing, flags, 539903b705cfSriastradh width, height, bpp, tiling, &pitch); 54009a906b70Schristos if (size == 0) { 54019a906b70Schristos DBG(("%s: invalid surface size (too large?)\n", __FUNCTION__)); 54029a906b70Schristos return NULL; 54039a906b70Schristos } 
54049a906b70Schristos 540503b705cfSriastradh size /= PAGE_SIZE; 540603b705cfSriastradh bucket = cache_bucket(size); 540703b705cfSriastradh 540803b705cfSriastradh if (flags & CREATE_SCANOUT) { 540903b705cfSriastradh struct kgem_bo *last = NULL; 541003b705cfSriastradh 541103b705cfSriastradh list_for_each_entry_reverse(bo, &kgem->scanout, list) { 541203b705cfSriastradh assert(bo->scanout); 541303b705cfSriastradh assert(!bo->flush); 54149a906b70Schristos assert(!bo->refcnt); 541503b705cfSriastradh assert_tiling(kgem, bo); 541603b705cfSriastradh 541703b705cfSriastradh if (size > num_pages(bo) || num_pages(bo) > 2*size) 541803b705cfSriastradh continue; 541903b705cfSriastradh 54209a906b70Schristos if (bo->tiling != tiling || bo->pitch != pitch) 54219a906b70Schristos /* No tiling/pitch without recreating fb */ 542203b705cfSriastradh continue; 542303b705cfSriastradh 54249a906b70Schristos if (bo->delta && !check_scanout_size(kgem, bo, width, height)) 542563ef14f0Smrg kgem_bo_rmfb(kgem, bo); 542603b705cfSriastradh 542703b705cfSriastradh if (flags & CREATE_INACTIVE && bo->rq) { 542803b705cfSriastradh last = bo; 542903b705cfSriastradh continue; 543003b705cfSriastradh } 543103b705cfSriastradh 543203b705cfSriastradh list_del(&bo->list); 543303b705cfSriastradh 543403b705cfSriastradh bo->unique_id = kgem_get_unique_id(kgem); 543503b705cfSriastradh DBG((" 1:from scanout: pitch=%d, tiling=%d, handle=%d, id=%d\n", 543603b705cfSriastradh bo->pitch, bo->tiling, bo->handle, bo->unique_id)); 543703b705cfSriastradh assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo)); 543803b705cfSriastradh assert_tiling(kgem, bo); 543903b705cfSriastradh bo->refcnt = 1; 544003b705cfSriastradh return bo; 544103b705cfSriastradh } 544203b705cfSriastradh 544303b705cfSriastradh if (last) { 544403b705cfSriastradh list_del(&last->list); 544503b705cfSriastradh 544603b705cfSriastradh last->unique_id = kgem_get_unique_id(kgem); 544703b705cfSriastradh DBG((" 1:from scanout: pitch=%d, 
tiling=%d, handle=%d, id=%d\n", 544803b705cfSriastradh last->pitch, last->tiling, last->handle, last->unique_id)); 544903b705cfSriastradh assert(last->pitch*kgem_aligned_height(kgem, height, last->tiling) <= kgem_bo_size(last)); 545003b705cfSriastradh assert_tiling(kgem, last); 545103b705cfSriastradh last->refcnt = 1; 545203b705cfSriastradh return last; 545303b705cfSriastradh } 545403b705cfSriastradh 545563ef14f0Smrg if (__to_sna(kgem)->scrn->vtSema) { 545663ef14f0Smrg ScrnInfoPtr scrn = __to_sna(kgem)->scrn; 54579a906b70Schristos 54589a906b70Schristos list_for_each_entry_reverse(bo, &kgem->scanout, list) { 54599a906b70Schristos struct drm_mode_fb_cmd arg; 54609a906b70Schristos 54619a906b70Schristos assert(bo->scanout); 54629a906b70Schristos assert(!bo->refcnt); 54639a906b70Schristos 54649a906b70Schristos if (size > num_pages(bo) || num_pages(bo) > 2*size) 54659a906b70Schristos continue; 54669a906b70Schristos 54679a906b70Schristos if (flags & CREATE_INACTIVE && bo->rq) 54689a906b70Schristos continue; 54699a906b70Schristos 54709a906b70Schristos list_del(&bo->list); 54719a906b70Schristos 54729a906b70Schristos if (bo->tiling != tiling || bo->pitch != pitch) { 54739a906b70Schristos if (bo->delta) { 54749a906b70Schristos kgem_bo_rmfb(kgem, bo); 54759a906b70Schristos bo->delta = 0; 54769a906b70Schristos } 54779a906b70Schristos 547863ef14f0Smrg if (!kgem_set_tiling(kgem, bo, 547963ef14f0Smrg tiling, pitch)) { 548063ef14f0Smrg bo->scanout = false; 548163ef14f0Smrg __kgem_bo_destroy(kgem, bo); 54829a906b70Schristos break; 54839a906b70Schristos } 54849a906b70Schristos } 54859a906b70Schristos 54869a906b70Schristos VG_CLEAR(arg); 54879a906b70Schristos arg.width = width; 54889a906b70Schristos arg.height = height; 54899a906b70Schristos arg.pitch = bo->pitch; 54909a906b70Schristos arg.bpp = scrn->bitsPerPixel; 54919a906b70Schristos arg.depth = scrn->depth; 54929a906b70Schristos arg.handle = bo->handle; 54939a906b70Schristos 54949a906b70Schristos if (do_ioctl(kgem->fd, 
DRM_IOCTL_MODE_ADDFB, &arg)) { 549563ef14f0Smrg bo->scanout = false; 549663ef14f0Smrg __kgem_bo_destroy(kgem, bo); 54979a906b70Schristos break; 54989a906b70Schristos } 54999a906b70Schristos 55009a906b70Schristos bo->delta = arg.fb_id; 55019a906b70Schristos bo->unique_id = kgem_get_unique_id(kgem); 55029a906b70Schristos 55039a906b70Schristos DBG((" 2:from scanout: pitch=%d, tiling=%d, handle=%d, id=%d\n", 55049a906b70Schristos bo->pitch, bo->tiling, bo->handle, bo->unique_id)); 55059a906b70Schristos assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo)); 55069a906b70Schristos assert_tiling(kgem, bo); 55079a906b70Schristos bo->refcnt = 1; 55089a906b70Schristos return bo; 55099a906b70Schristos } 55109a906b70Schristos } 55119a906b70Schristos 551263ef14f0Smrg if (flags & CREATE_CACHED) 551363ef14f0Smrg return NULL; 551463ef14f0Smrg 551503b705cfSriastradh bo = __kgem_bo_create_as_display(kgem, size, tiling, pitch); 551603b705cfSriastradh if (bo) 551703b705cfSriastradh return bo; 55189a906b70Schristos 55199a906b70Schristos flags |= CREATE_INACTIVE; 552003b705cfSriastradh } 552103b705cfSriastradh 552203b705cfSriastradh if (bucket >= NUM_CACHE_BUCKETS) { 552303b705cfSriastradh DBG(("%s: large bo num pages=%d, bucket=%d\n", 552403b705cfSriastradh __FUNCTION__, size, bucket)); 552503b705cfSriastradh 552603b705cfSriastradh if (flags & CREATE_INACTIVE) 552703b705cfSriastradh goto large_inactive; 552803b705cfSriastradh 552903b705cfSriastradh tiled_height = kgem_aligned_height(kgem, height, tiling); 553003b705cfSriastradh 553103b705cfSriastradh list_for_each_entry(bo, &kgem->large, list) { 553203b705cfSriastradh assert(!bo->purged); 553303b705cfSriastradh assert(!bo->scanout); 553403b705cfSriastradh assert(bo->refcnt == 0); 553503b705cfSriastradh assert(bo->reusable); 553603b705cfSriastradh assert_tiling(kgem, bo); 553703b705cfSriastradh 553803b705cfSriastradh if (kgem->gen < 040) { 553903b705cfSriastradh if (bo->pitch < pitch) { 
554003b705cfSriastradh DBG(("tiled and pitch too small: tiling=%d, (want %d), pitch=%d, need %d\n", 554103b705cfSriastradh bo->tiling, tiling, 554203b705cfSriastradh bo->pitch, pitch)); 554303b705cfSriastradh continue; 554403b705cfSriastradh } 554503b705cfSriastradh 554603b705cfSriastradh if (bo->pitch * tiled_height > bytes(bo)) 554703b705cfSriastradh continue; 554803b705cfSriastradh } else { 554903b705cfSriastradh if (num_pages(bo) < size) 555003b705cfSriastradh continue; 555103b705cfSriastradh 555263ef14f0Smrg if (!kgem_set_tiling(kgem, bo, tiling, pitch)) { 555363ef14f0Smrg if (exact) { 555463ef14f0Smrg DBG(("tiled and pitch not exact: tiling=%d, (want %d), pitch=%d, need %d\n", 555563ef14f0Smrg bo->tiling, tiling, 555663ef14f0Smrg bo->pitch, pitch)); 555703b705cfSriastradh continue; 555863ef14f0Smrg } 555903b705cfSriastradh 556063ef14f0Smrg set_gpu_tiling(kgem, bo, tiling, pitch); 556103b705cfSriastradh } 556203b705cfSriastradh } 556303b705cfSriastradh 556403b705cfSriastradh kgem_bo_remove_from_active(kgem, bo); 556503b705cfSriastradh 556603b705cfSriastradh bo->unique_id = kgem_get_unique_id(kgem); 556703b705cfSriastradh bo->delta = 0; 556803b705cfSriastradh DBG((" 1:from active: pitch=%d, tiling=%d, handle=%d, id=%d\n", 556903b705cfSriastradh bo->pitch, bo->tiling, bo->handle, bo->unique_id)); 557003b705cfSriastradh assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo)); 557103b705cfSriastradh assert_tiling(kgem, bo); 557203b705cfSriastradh bo->refcnt = 1; 557303b705cfSriastradh return bo; 557403b705cfSriastradh } 557503b705cfSriastradh 557603b705cfSriastradhlarge_inactive: 557703b705cfSriastradh __kgem_throttle_retire(kgem, flags); 557803b705cfSriastradh list_for_each_entry(bo, &kgem->large_inactive, list) { 557903b705cfSriastradh assert(bo->refcnt == 0); 558003b705cfSriastradh assert(bo->reusable); 558103b705cfSriastradh assert(!bo->scanout); 558203b705cfSriastradh assert_tiling(kgem, bo); 558303b705cfSriastradh 
558403b705cfSriastradh if (size > num_pages(bo)) 558503b705cfSriastradh continue; 558603b705cfSriastradh 558763ef14f0Smrg if (!kgem_set_tiling(kgem, bo, tiling, pitch)) { 558863ef14f0Smrg if (kgem->gen >= 040 && !exact) 558963ef14f0Smrg set_gpu_tiling(kgem, bo, tiling, pitch); 559063ef14f0Smrg else 559103b705cfSriastradh continue; 559203b705cfSriastradh } 559303b705cfSriastradh 559403b705cfSriastradh if (bo->purged && !kgem_bo_clear_purgeable(kgem, bo)) { 559503b705cfSriastradh kgem_bo_free(kgem, bo); 559603b705cfSriastradh break; 559703b705cfSriastradh } 559803b705cfSriastradh 559903b705cfSriastradh list_del(&bo->list); 560003b705cfSriastradh 560103b705cfSriastradh assert(bo->domain != DOMAIN_GPU); 560203b705cfSriastradh bo->unique_id = kgem_get_unique_id(kgem); 560303b705cfSriastradh bo->delta = 0; 560403b705cfSriastradh DBG((" 1:from large inactive: pitch=%d, tiling=%d, handle=%d, id=%d\n", 560503b705cfSriastradh bo->pitch, bo->tiling, bo->handle, bo->unique_id)); 560603b705cfSriastradh assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo)); 560703b705cfSriastradh assert_tiling(kgem, bo); 560803b705cfSriastradh bo->refcnt = 1; 56099a906b70Schristos 56109a906b70Schristos if (flags & CREATE_SCANOUT) 56119a906b70Schristos __kgem_bo_make_scanout(kgem, bo, width, height); 56129a906b70Schristos 561303b705cfSriastradh return bo; 561403b705cfSriastradh } 561503b705cfSriastradh 561603b705cfSriastradh goto create; 561703b705cfSriastradh } 561803b705cfSriastradh 561903b705cfSriastradh if (flags & (CREATE_CPU_MAP | CREATE_GTT_MAP)) { 562003b705cfSriastradh int for_cpu = !!(flags & CREATE_CPU_MAP); 562103b705cfSriastradh if (kgem->has_llc && tiling == I915_TILING_NONE) 562203b705cfSriastradh for_cpu = 1; 562303b705cfSriastradh /* We presume that we will need to upload to this bo, 562403b705cfSriastradh * and so would prefer to have an active VMA. 
562503b705cfSriastradh */ 562603b705cfSriastradh cache = &kgem->vma[for_cpu].inactive[bucket]; 562703b705cfSriastradh do { 562803b705cfSriastradh list_for_each_entry(bo, cache, vma) { 562903b705cfSriastradh assert(bucket(bo) == bucket); 563003b705cfSriastradh assert(bo->refcnt == 0); 563103b705cfSriastradh assert(!bo->scanout); 5632813957e3Ssnj assert(for_cpu ? !!bo->map__cpu : (bo->map__gtt || bo->map__wc)); 563303b705cfSriastradh assert(bo->rq == NULL); 56349a906b70Schristos assert(bo->exec == NULL); 563503b705cfSriastradh assert(list_is_empty(&bo->request)); 563603b705cfSriastradh assert(bo->flush == false); 563703b705cfSriastradh assert_tiling(kgem, bo); 563803b705cfSriastradh 563903b705cfSriastradh if (size > num_pages(bo)) { 564003b705cfSriastradh DBG(("inactive too small: %d < %d\n", 564103b705cfSriastradh num_pages(bo), size)); 564203b705cfSriastradh continue; 564303b705cfSriastradh } 564403b705cfSriastradh 56459a906b70Schristos if (flags & UNCACHED && !kgem->has_llc && bo->domain != DOMAIN_CPU) 56469a906b70Schristos continue; 56479a906b70Schristos 564803b705cfSriastradh if (bo->tiling != tiling || 564903b705cfSriastradh (tiling != I915_TILING_NONE && bo->pitch != pitch)) { 56509a906b70Schristos if (bo->map__gtt || 565163ef14f0Smrg !kgem_set_tiling(kgem, bo, 565263ef14f0Smrg tiling, pitch)) { 56539a906b70Schristos DBG(("inactive GTT vma with wrong tiling: %d < %d\n", 56549a906b70Schristos bo->tiling, tiling)); 565563ef14f0Smrg kgem_bo_free(kgem, bo); 565663ef14f0Smrg break; 56579a906b70Schristos } 565803b705cfSriastradh } 565903b705cfSriastradh 566003b705cfSriastradh if (bo->purged && !kgem_bo_clear_purgeable(kgem, bo)) { 566103b705cfSriastradh kgem_bo_free(kgem, bo); 566203b705cfSriastradh break; 566303b705cfSriastradh } 566403b705cfSriastradh 566563ef14f0Smrg if (tiling == I915_TILING_NONE) 566663ef14f0Smrg bo->pitch = pitch; 566763ef14f0Smrg 566803b705cfSriastradh assert(bo->tiling == tiling); 566963ef14f0Smrg assert(bo->pitch >= pitch); 
567003b705cfSriastradh bo->delta = 0; 567103b705cfSriastradh bo->unique_id = kgem_get_unique_id(kgem); 567203b705cfSriastradh 567303b705cfSriastradh kgem_bo_remove_from_inactive(kgem, bo); 56749a906b70Schristos assert(list_is_empty(&bo->list)); 56759a906b70Schristos assert(list_is_empty(&bo->vma)); 567603b705cfSriastradh 567703b705cfSriastradh DBG((" from inactive vma: pitch=%d, tiling=%d: handle=%d, id=%d\n", 567803b705cfSriastradh bo->pitch, bo->tiling, bo->handle, bo->unique_id)); 567903b705cfSriastradh assert(bo->reusable); 568003b705cfSriastradh assert(bo->domain != DOMAIN_GPU); 568103b705cfSriastradh ASSERT_IDLE(kgem, bo->handle); 568203b705cfSriastradh assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo)); 568303b705cfSriastradh assert_tiling(kgem, bo); 568403b705cfSriastradh bo->refcnt = 1; 568503b705cfSriastradh return bo; 568603b705cfSriastradh } 568703b705cfSriastradh } while (!list_is_empty(cache) && 568803b705cfSriastradh __kgem_throttle_retire(kgem, flags)); 568903b705cfSriastradh 569003b705cfSriastradh if (flags & CREATE_CPU_MAP && !kgem->has_llc) { 569103b705cfSriastradh if (list_is_empty(&kgem->active[bucket][tiling]) && 569203b705cfSriastradh list_is_empty(&kgem->inactive[bucket])) 569303b705cfSriastradh flags &= ~CREATE_CACHED; 569403b705cfSriastradh 569503b705cfSriastradh goto create; 569603b705cfSriastradh } 569703b705cfSriastradh } 569803b705cfSriastradh 569903b705cfSriastradh if (flags & CREATE_INACTIVE) 570003b705cfSriastradh goto skip_active_search; 570103b705cfSriastradh 570203b705cfSriastradh /* Best active match */ 570303b705cfSriastradh retry = NUM_CACHE_BUCKETS - bucket; 570403b705cfSriastradh if (retry > 3 && (flags & CREATE_TEMPORARY) == 0) 570503b705cfSriastradh retry = 3; 57069a906b70Schristossearch_active: 570703b705cfSriastradh assert(bucket < NUM_CACHE_BUCKETS); 570803b705cfSriastradh cache = &kgem->active[bucket][tiling]; 570903b705cfSriastradh if (tiling) { 571003b705cfSriastradh tiled_height = 
kgem_aligned_height(kgem, height, tiling); 571103b705cfSriastradh list_for_each_entry(bo, cache, list) { 571203b705cfSriastradh assert(!bo->purged); 571303b705cfSriastradh assert(bo->refcnt == 0); 571403b705cfSriastradh assert(bucket(bo) == bucket); 571503b705cfSriastradh assert(bo->reusable); 571603b705cfSriastradh assert(bo->tiling == tiling); 571703b705cfSriastradh assert(bo->flush == false); 571803b705cfSriastradh assert(!bo->scanout); 571903b705cfSriastradh assert_tiling(kgem, bo); 572003b705cfSriastradh 572103b705cfSriastradh if (kgem->gen < 040) { 572203b705cfSriastradh if (bo->pitch < pitch) { 572303b705cfSriastradh DBG(("tiled and pitch too small: tiling=%d, (want %d), pitch=%d, need %d\n", 572403b705cfSriastradh bo->tiling, tiling, 572503b705cfSriastradh bo->pitch, pitch)); 572603b705cfSriastradh continue; 572703b705cfSriastradh } 572803b705cfSriastradh 572903b705cfSriastradh if (bo->pitch * tiled_height > bytes(bo)) 573003b705cfSriastradh continue; 573103b705cfSriastradh } else { 573203b705cfSriastradh if (num_pages(bo) < size) 573303b705cfSriastradh continue; 573403b705cfSriastradh 573563ef14f0Smrg if (!kgem_set_tiling(kgem, bo, tiling, pitch)) { 573663ef14f0Smrg if (exact) { 573763ef14f0Smrg DBG(("tiled and pitch not exact: tiling=%d, (want %d), pitch=%d, need %d\n", 573863ef14f0Smrg bo->tiling, tiling, 573963ef14f0Smrg bo->pitch, pitch)); 574003b705cfSriastradh continue; 574163ef14f0Smrg } 574203b705cfSriastradh 574363ef14f0Smrg set_gpu_tiling(kgem, bo, tiling, pitch); 574403b705cfSriastradh } 574503b705cfSriastradh } 574663ef14f0Smrg assert(bo->tiling == tiling); 574763ef14f0Smrg assert(bo->pitch >= pitch); 574803b705cfSriastradh 574903b705cfSriastradh kgem_bo_remove_from_active(kgem, bo); 575003b705cfSriastradh 575103b705cfSriastradh bo->unique_id = kgem_get_unique_id(kgem); 575203b705cfSriastradh bo->delta = 0; 575303b705cfSriastradh DBG((" 1:from active: pitch=%d, tiling=%d, handle=%d, id=%d\n", 575403b705cfSriastradh bo->pitch, bo->tiling, 
bo->handle, bo->unique_id)); 575503b705cfSriastradh assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo)); 575603b705cfSriastradh assert_tiling(kgem, bo); 575703b705cfSriastradh bo->refcnt = 1; 575803b705cfSriastradh return bo; 575903b705cfSriastradh } 576003b705cfSriastradh } else { 576103b705cfSriastradh list_for_each_entry(bo, cache, list) { 576203b705cfSriastradh assert(bucket(bo) == bucket); 576303b705cfSriastradh assert(!bo->purged); 576403b705cfSriastradh assert(bo->refcnt == 0); 576503b705cfSriastradh assert(bo->reusable); 576603b705cfSriastradh assert(!bo->scanout); 576703b705cfSriastradh assert(bo->tiling == tiling); 576803b705cfSriastradh assert(bo->flush == false); 576903b705cfSriastradh assert_tiling(kgem, bo); 577003b705cfSriastradh 577103b705cfSriastradh if (num_pages(bo) < size) 577203b705cfSriastradh continue; 577303b705cfSriastradh 577403b705cfSriastradh kgem_bo_remove_from_active(kgem, bo); 577503b705cfSriastradh 577603b705cfSriastradh bo->pitch = pitch; 577703b705cfSriastradh bo->unique_id = kgem_get_unique_id(kgem); 577803b705cfSriastradh bo->delta = 0; 577903b705cfSriastradh DBG((" 1:from active: pitch=%d, tiling=%d, handle=%d, id=%d\n", 578003b705cfSriastradh bo->pitch, bo->tiling, bo->handle, bo->unique_id)); 578103b705cfSriastradh assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo)); 578203b705cfSriastradh assert_tiling(kgem, bo); 578303b705cfSriastradh bo->refcnt = 1; 578403b705cfSriastradh return bo; 578503b705cfSriastradh } 578603b705cfSriastradh } 578703b705cfSriastradh 57889a906b70Schristos if (kgem->gen >= 040) { 57899a906b70Schristos for (i = I915_TILING_Y; i >= I915_TILING_NONE; i--) { 57909a906b70Schristos cache = &kgem->active[bucket][i]; 57919a906b70Schristos list_for_each_entry(bo, cache, list) { 57929a906b70Schristos assert(!bo->purged); 57939a906b70Schristos assert(bo->refcnt == 0); 57949a906b70Schristos assert(bo->reusable); 57959a906b70Schristos 
assert(!bo->scanout); 57969a906b70Schristos assert(bo->flush == false); 57979a906b70Schristos assert_tiling(kgem, bo); 579803b705cfSriastradh 57999a906b70Schristos if (num_pages(bo) < size) 58009a906b70Schristos continue; 580103b705cfSriastradh 580263ef14f0Smrg if (!kgem_set_tiling(kgem, bo, tiling, pitch)) { 580363ef14f0Smrg if (exact || kgem->gen < 040) 580403b705cfSriastradh continue; 580563ef14f0Smrg 580663ef14f0Smrg set_gpu_tiling(kgem, bo, tiling, pitch); 58079a906b70Schristos } 580863ef14f0Smrg assert(bo->tiling == tiling); 580963ef14f0Smrg assert(bo->pitch >= pitch); 581003b705cfSriastradh 58119a906b70Schristos kgem_bo_remove_from_active(kgem, bo); 581203b705cfSriastradh 58139a906b70Schristos bo->unique_id = kgem_get_unique_id(kgem); 58149a906b70Schristos bo->delta = 0; 58159a906b70Schristos DBG((" 1:from active: pitch=%d, tiling=%d, handle=%d, id=%d\n", 58169a906b70Schristos bo->pitch, bo->tiling, bo->handle, bo->unique_id)); 58179a906b70Schristos assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo)); 58189a906b70Schristos assert_tiling(kgem, bo); 58199a906b70Schristos bo->refcnt = 1; 58209a906b70Schristos return bo; 582103b705cfSriastradh } 582203b705cfSriastradh } 58239a906b70Schristos } else if (!exact) { /* allow an active near-miss? 
*/ 58249a906b70Schristos for (i = tiling; i >= I915_TILING_NONE; i--) { 582503b705cfSriastradh tiled_height = kgem_surface_size(kgem, kgem->has_relaxed_fencing, flags, 582603b705cfSriastradh width, height, bpp, tiling, &pitch); 582703b705cfSriastradh cache = active(kgem, tiled_height / PAGE_SIZE, i); 582803b705cfSriastradh tiled_height = kgem_aligned_height(kgem, height, i); 582903b705cfSriastradh list_for_each_entry(bo, cache, list) { 583003b705cfSriastradh assert(!bo->purged); 583103b705cfSriastradh assert(bo->refcnt == 0); 583203b705cfSriastradh assert(bo->reusable); 583303b705cfSriastradh assert(!bo->scanout); 583403b705cfSriastradh assert(bo->flush == false); 583503b705cfSriastradh assert_tiling(kgem, bo); 583603b705cfSriastradh 583703b705cfSriastradh if (bo->tiling) { 583803b705cfSriastradh if (bo->pitch < pitch) { 583903b705cfSriastradh DBG(("tiled and pitch too small: tiling=%d, (want %d), pitch=%d, need %d\n", 584003b705cfSriastradh bo->tiling, tiling, 584103b705cfSriastradh bo->pitch, pitch)); 584203b705cfSriastradh continue; 584303b705cfSriastradh } 584403b705cfSriastradh } else 584503b705cfSriastradh bo->pitch = pitch; 584603b705cfSriastradh 584703b705cfSriastradh if (bo->pitch * tiled_height > bytes(bo)) 584803b705cfSriastradh continue; 584903b705cfSriastradh 585003b705cfSriastradh kgem_bo_remove_from_active(kgem, bo); 585103b705cfSriastradh 585203b705cfSriastradh bo->unique_id = kgem_get_unique_id(kgem); 585303b705cfSriastradh bo->delta = 0; 585403b705cfSriastradh DBG((" 1:from active: pitch=%d, tiling=%d, handle=%d, id=%d\n", 585503b705cfSriastradh bo->pitch, bo->tiling, bo->handle, bo->unique_id)); 585603b705cfSriastradh assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo)); 585703b705cfSriastradh assert_tiling(kgem, bo); 585803b705cfSriastradh bo->refcnt = 1; 585903b705cfSriastradh return bo; 586003b705cfSriastradh } 586103b705cfSriastradh } 586203b705cfSriastradh } 586303b705cfSriastradh 58649a906b70Schristos if 
(--retry) { 58659a906b70Schristos bucket++; 58669a906b70Schristos goto search_active; 58679a906b70Schristos } 58689a906b70Schristos 586903b705cfSriastradhskip_active_search: 587003b705cfSriastradh bucket = cache_bucket(size); 587103b705cfSriastradh retry = NUM_CACHE_BUCKETS - bucket; 587203b705cfSriastradh if (retry > 3) 587303b705cfSriastradh retry = 3; 587403b705cfSriastradhsearch_inactive: 587503b705cfSriastradh /* Now just look for a close match and prefer any currently active */ 587603b705cfSriastradh assert(bucket < NUM_CACHE_BUCKETS); 587703b705cfSriastradh cache = &kgem->inactive[bucket]; 587803b705cfSriastradh list_for_each_entry(bo, cache, list) { 587903b705cfSriastradh assert(bucket(bo) == bucket); 588003b705cfSriastradh assert(bo->reusable); 588103b705cfSriastradh assert(!bo->scanout); 588203b705cfSriastradh assert(bo->flush == false); 588303b705cfSriastradh assert_tiling(kgem, bo); 588403b705cfSriastradh 588503b705cfSriastradh if (size > num_pages(bo)) { 588603b705cfSriastradh DBG(("inactive too small: %d < %d\n", 588703b705cfSriastradh num_pages(bo), size)); 588803b705cfSriastradh continue; 588903b705cfSriastradh } 589003b705cfSriastradh 589163ef14f0Smrg if (!kgem_set_tiling(kgem, bo, tiling, pitch)) { 589263ef14f0Smrg if (exact || kgem->gen < 040) { 589363ef14f0Smrg kgem_bo_free(kgem, bo); 589463ef14f0Smrg break; 589563ef14f0Smrg } 589663ef14f0Smrg 589763ef14f0Smrg set_gpu_tiling(kgem, bo, tiling, pitch); 589803b705cfSriastradh } 589903b705cfSriastradh 590003b705cfSriastradh if (bo->purged && !kgem_bo_clear_purgeable(kgem, bo)) { 590103b705cfSriastradh kgem_bo_free(kgem, bo); 590203b705cfSriastradh break; 590303b705cfSriastradh } 590403b705cfSriastradh 590503b705cfSriastradh kgem_bo_remove_from_inactive(kgem, bo); 59069a906b70Schristos assert(list_is_empty(&bo->list)); 59079a906b70Schristos assert(list_is_empty(&bo->vma)); 590863ef14f0Smrg assert(bo->tiling == tiling); 590963ef14f0Smrg assert(bo->pitch >= pitch); 591003b705cfSriastradh 
591103b705cfSriastradh bo->delta = 0; 591203b705cfSriastradh bo->unique_id = kgem_get_unique_id(kgem); 591303b705cfSriastradh assert(bo->pitch); 591403b705cfSriastradh DBG((" from inactive: pitch=%d, tiling=%d: handle=%d, id=%d\n", 591503b705cfSriastradh bo->pitch, bo->tiling, bo->handle, bo->unique_id)); 591603b705cfSriastradh assert(bo->refcnt == 0); 591703b705cfSriastradh assert(bo->reusable); 591803b705cfSriastradh assert((flags & CREATE_INACTIVE) == 0 || bo->domain != DOMAIN_GPU); 591903b705cfSriastradh ASSERT_MAYBE_IDLE(kgem, bo->handle, flags & CREATE_INACTIVE); 592003b705cfSriastradh assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo)); 592103b705cfSriastradh assert_tiling(kgem, bo); 592203b705cfSriastradh bo->refcnt = 1; 59239a906b70Schristos 59249a906b70Schristos if (flags & CREATE_SCANOUT) 59259a906b70Schristos __kgem_bo_make_scanout(kgem, bo, width, height); 59269a906b70Schristos 592703b705cfSriastradh return bo; 592803b705cfSriastradh } 592903b705cfSriastradh 59309a906b70Schristos if ((flags & CREATE_NO_RETIRE) == 0) { 59319a906b70Schristos list_for_each_entry_reverse(bo, &kgem->active[bucket][tiling], list) { 59329a906b70Schristos if (bo->exec) 59339a906b70Schristos break; 59349a906b70Schristos 59359a906b70Schristos if (size > num_pages(bo)) 59369a906b70Schristos continue; 59379a906b70Schristos 59389a906b70Schristos if (__kgem_busy(kgem, bo->handle)) { 59399a906b70Schristos if (flags & CREATE_NO_THROTTLE) 59409a906b70Schristos goto no_retire; 59419a906b70Schristos 59429a906b70Schristos do { 59439a906b70Schristos if (!kgem->need_throttle) { 59449a906b70Schristos DBG(("%s: not throttling for active handle=%d\n", __FUNCTION__, bo->handle)); 59459a906b70Schristos goto no_retire; 59469a906b70Schristos } 59479a906b70Schristos 59489a906b70Schristos __kgem_throttle(kgem, false); 59499a906b70Schristos } while (__kgem_busy(kgem, bo->handle)); 59509a906b70Schristos } 59519a906b70Schristos 59529a906b70Schristos DBG(("%s: flushed 
active handle=%d\n", __FUNCTION__, bo->handle)); 59539a906b70Schristos 59549a906b70Schristos kgem_bo_remove_from_active(kgem, bo); 59559a906b70Schristos __kgem_bo_clear_busy(bo); 59569a906b70Schristos 595763ef14f0Smrg if (!kgem_set_tiling(kgem, bo, tiling, pitch)) { 595863ef14f0Smrg if (exact || kgem->gen < 040) 59599a906b70Schristos goto no_retire; 596063ef14f0Smrg 596163ef14f0Smrg set_gpu_tiling(kgem, bo, tiling, pitch); 59629a906b70Schristos } 596363ef14f0Smrg assert(bo->tiling == tiling); 596463ef14f0Smrg assert(bo->pitch >= pitch); 59659a906b70Schristos 59669a906b70Schristos bo->unique_id = kgem_get_unique_id(kgem); 59679a906b70Schristos bo->delta = 0; 59689a906b70Schristos DBG((" 2:from active: pitch=%d, tiling=%d, handle=%d, id=%d\n", 59699a906b70Schristos bo->pitch, bo->tiling, bo->handle, bo->unique_id)); 59709a906b70Schristos assert(bo->pitch*kgem_aligned_height(kgem, height, bo->tiling) <= kgem_bo_size(bo)); 59719a906b70Schristos assert_tiling(kgem, bo); 59729a906b70Schristos bo->refcnt = 1; 59739a906b70Schristos 59749a906b70Schristos if (flags & CREATE_SCANOUT) 59759a906b70Schristos __kgem_bo_make_scanout(kgem, bo, width, height); 59769a906b70Schristos 59779a906b70Schristos return bo; 59789a906b70Schristos } 59799a906b70Schristosno_retire: 59809a906b70Schristos flags |= CREATE_NO_RETIRE; 598103b705cfSriastradh } 598203b705cfSriastradh 598303b705cfSriastradh if (--retry) { 598403b705cfSriastradh bucket++; 598503b705cfSriastradh goto search_inactive; 598603b705cfSriastradh } 598703b705cfSriastradh 598803b705cfSriastradhcreate: 59899a906b70Schristos if (flags & CREATE_CACHED) { 59909a906b70Schristos DBG(("%s: no cached bo found, requested not to create a new bo\n", __FUNCTION__)); 599103b705cfSriastradh return NULL; 59929a906b70Schristos } 599303b705cfSriastradh 599403b705cfSriastradh if (bucket >= NUM_CACHE_BUCKETS) 599503b705cfSriastradh size = ALIGN(size, 1024); 599603b705cfSriastradh handle = gem_create(kgem->fd, size); 59979a906b70Schristos if (handle 
== 0) { 59989a906b70Schristos DBG(("%s: kernel allocation (gem_create) failure\n", __FUNCTION__)); 599903b705cfSriastradh return NULL; 60009a906b70Schristos } 600103b705cfSriastradh 600203b705cfSriastradh bo = __kgem_bo_alloc(handle, size); 600303b705cfSriastradh if (!bo) { 60049a906b70Schristos DBG(("%s: malloc failed\n", __FUNCTION__)); 600503b705cfSriastradh gem_close(kgem->fd, handle); 600603b705cfSriastradh return NULL; 600703b705cfSriastradh } 600803b705cfSriastradh 600903b705cfSriastradh bo->unique_id = kgem_get_unique_id(kgem); 601063ef14f0Smrg if (kgem_set_tiling(kgem, bo, tiling, pitch)) { 60119a906b70Schristos if (flags & CREATE_SCANOUT) 60129a906b70Schristos __kgem_bo_make_scanout(kgem, bo, width, height); 601303b705cfSriastradh } else { 601463ef14f0Smrg if (kgem->gen >= 040) { 601563ef14f0Smrg assert(!kgem->can_fence); 601663ef14f0Smrg bo->tiling = tiling; 601763ef14f0Smrg bo->pitch = pitch; 601863ef14f0Smrg } else { 601963ef14f0Smrg if (flags & CREATE_EXACT) { 602063ef14f0Smrg DBG(("%s: failed to set exact tiling (gem_set_tiling)\n", __FUNCTION__)); 602163ef14f0Smrg gem_close(kgem->fd, handle); 602263ef14f0Smrg free(bo); 602363ef14f0Smrg return NULL; 602463ef14f0Smrg } 602503b705cfSriastradh } 602603b705cfSriastradh } 602703b705cfSriastradh 602803b705cfSriastradh assert(bytes(bo) >= bo->pitch * kgem_aligned_height(kgem, height, bo->tiling)); 602903b705cfSriastradh assert_tiling(kgem, bo); 603003b705cfSriastradh 603103b705cfSriastradh debug_alloc__bo(kgem, bo); 603203b705cfSriastradh 603303b705cfSriastradh DBG((" new pitch=%d, tiling=%d, handle=%d, id=%d, num_pages=%d [%d], bucket=%d\n", 603403b705cfSriastradh bo->pitch, bo->tiling, bo->handle, bo->unique_id, 603503b705cfSriastradh size, num_pages(bo), bucket(bo))); 603603b705cfSriastradh return bo; 603703b705cfSriastradh} 603803b705cfSriastradh 603903b705cfSriastradhstruct kgem_bo *kgem_create_cpu_2d(struct kgem *kgem, 604003b705cfSriastradh int width, 604103b705cfSriastradh int height, 
604203b705cfSriastradh int bpp, 604303b705cfSriastradh uint32_t flags) 604403b705cfSriastradh{ 604503b705cfSriastradh struct kgem_bo *bo; 604603b705cfSriastradh int stride, size; 604703b705cfSriastradh 604803b705cfSriastradh if (DBG_NO_CPU) 604903b705cfSriastradh return NULL; 605003b705cfSriastradh 605103b705cfSriastradh DBG(("%s(%dx%d, bpp=%d)\n", __FUNCTION__, width, height, bpp)); 605203b705cfSriastradh 605303b705cfSriastradh if (kgem->has_llc) { 605403b705cfSriastradh bo = kgem_create_2d(kgem, width, height, bpp, 605503b705cfSriastradh I915_TILING_NONE, flags); 605603b705cfSriastradh if (bo == NULL) 605703b705cfSriastradh return bo; 605803b705cfSriastradh 605903b705cfSriastradh assert(bo->tiling == I915_TILING_NONE); 606003b705cfSriastradh assert_tiling(kgem, bo); 606103b705cfSriastradh 606203b705cfSriastradh if (kgem_bo_map__cpu(kgem, bo) == NULL) { 606303b705cfSriastradh kgem_bo_destroy(kgem, bo); 606403b705cfSriastradh return NULL; 606503b705cfSriastradh } 606603b705cfSriastradh 606703b705cfSriastradh return bo; 606803b705cfSriastradh } 606903b705cfSriastradh 607003b705cfSriastradh assert(width > 0 && height > 0); 607103b705cfSriastradh stride = ALIGN(width, 2) * bpp >> 3; 607203b705cfSriastradh stride = ALIGN(stride, 4); 607303b705cfSriastradh size = stride * ALIGN(height, 2); 607403b705cfSriastradh assert(size >= PAGE_SIZE); 607503b705cfSriastradh 607603b705cfSriastradh DBG(("%s: %dx%d, %d bpp, stride=%d\n", 607703b705cfSriastradh __FUNCTION__, width, height, bpp, stride)); 607803b705cfSriastradh 607903b705cfSriastradh bo = search_snoop_cache(kgem, NUM_PAGES(size), 0); 608003b705cfSriastradh if (bo) { 608103b705cfSriastradh assert(bo->tiling == I915_TILING_NONE); 608203b705cfSriastradh assert_tiling(kgem, bo); 608303b705cfSriastradh assert(bo->snoop); 608403b705cfSriastradh bo->refcnt = 1; 608503b705cfSriastradh bo->pitch = stride; 608603b705cfSriastradh bo->unique_id = kgem_get_unique_id(kgem); 608703b705cfSriastradh return bo; 608803b705cfSriastradh } 
608903b705cfSriastradh 609003b705cfSriastradh if (kgem->has_caching) { 609103b705cfSriastradh bo = kgem_create_linear(kgem, size, flags); 609203b705cfSriastradh if (bo == NULL) 609303b705cfSriastradh return NULL; 609403b705cfSriastradh 609503b705cfSriastradh assert(bo->tiling == I915_TILING_NONE); 609603b705cfSriastradh assert_tiling(kgem, bo); 609703b705cfSriastradh 6098813957e3Ssnj assert(!__kgem_busy(kgem, bo->handle)); 609903b705cfSriastradh if (!gem_set_caching(kgem->fd, bo->handle, SNOOPED)) { 610003b705cfSriastradh kgem_bo_destroy(kgem, bo); 610103b705cfSriastradh return NULL; 610203b705cfSriastradh } 610303b705cfSriastradh bo->snoop = true; 610403b705cfSriastradh 610503b705cfSriastradh if (kgem_bo_map__cpu(kgem, bo) == NULL) { 610603b705cfSriastradh kgem_bo_destroy(kgem, bo); 610703b705cfSriastradh return NULL; 610803b705cfSriastradh } 610903b705cfSriastradh 611003b705cfSriastradh bo->pitch = stride; 611103b705cfSriastradh bo->unique_id = kgem_get_unique_id(kgem); 611203b705cfSriastradh return bo; 611303b705cfSriastradh } 611403b705cfSriastradh 611503b705cfSriastradh if (kgem->has_userptr) { 611603b705cfSriastradh void *ptr; 611703b705cfSriastradh 611803b705cfSriastradh /* XXX */ 611903b705cfSriastradh //if (posix_memalign(&ptr, 64, ALIGN(size, 64))) 612003b705cfSriastradh if (posix_memalign(&ptr, PAGE_SIZE, ALIGN(size, PAGE_SIZE))) 612103b705cfSriastradh return NULL; 612203b705cfSriastradh 612303b705cfSriastradh bo = kgem_create_map(kgem, ptr, size, false); 612403b705cfSriastradh if (bo == NULL) { 612503b705cfSriastradh free(ptr); 612603b705cfSriastradh return NULL; 612703b705cfSriastradh } 612803b705cfSriastradh 612903b705cfSriastradh bo->pitch = stride; 613003b705cfSriastradh bo->unique_id = kgem_get_unique_id(kgem); 613103b705cfSriastradh return bo; 613203b705cfSriastradh } 613303b705cfSriastradh 613403b705cfSriastradh return NULL; 613503b705cfSriastradh} 613603b705cfSriastradh 613703b705cfSriastradhvoid _kgem_bo_destroy(struct kgem *kgem, struct 
kgem_bo *bo) 613803b705cfSriastradh{ 613903b705cfSriastradh DBG(("%s: handle=%d, proxy? %d\n", 614003b705cfSriastradh __FUNCTION__, bo->handle, bo->proxy != NULL)); 614103b705cfSriastradh 614203b705cfSriastradh if (bo->proxy) { 61439a906b70Schristos assert(!bo->reusable); 61449a906b70Schristos kgem_bo_binding_free(kgem, bo); 61459a906b70Schristos 61469a906b70Schristos assert(list_is_empty(&bo->list)); 614703b705cfSriastradh _list_del(&bo->vma); 614803b705cfSriastradh _list_del(&bo->request); 61499a906b70Schristos 61509a906b70Schristos if (bo->io && bo->domain == DOMAIN_CPU) 615103b705cfSriastradh _kgem_bo_delete_buffer(kgem, bo); 61529a906b70Schristos 615303b705cfSriastradh kgem_bo_unref(kgem, bo->proxy); 615403b705cfSriastradh 61559a906b70Schristos if (DBG_NO_MALLOC_CACHE) { 61569a906b70Schristos free(bo); 61579a906b70Schristos } else { 61589a906b70Schristos *(struct kgem_bo **)bo = __kgem_freed_bo; 61599a906b70Schristos __kgem_freed_bo = bo; 61609a906b70Schristos } 61619a906b70Schristos } else 61629a906b70Schristos __kgem_bo_destroy(kgem, bo); 616303b705cfSriastradh} 616403b705cfSriastradh 616503b705cfSriastradhstatic void __kgem_flush(struct kgem *kgem, struct kgem_bo *bo) 616603b705cfSriastradh{ 616703b705cfSriastradh assert(bo->rq); 616803b705cfSriastradh assert(bo->exec == NULL); 616903b705cfSriastradh assert(bo->needs_flush); 617003b705cfSriastradh 617103b705cfSriastradh /* The kernel will emit a flush *and* update its own flushing lists. 
*/ 617203b705cfSriastradh if (!__kgem_busy(kgem, bo->handle)) 617303b705cfSriastradh __kgem_bo_clear_busy(bo); 617403b705cfSriastradh 617503b705cfSriastradh DBG(("%s: handle=%d, busy?=%d\n", 617603b705cfSriastradh __FUNCTION__, bo->handle, bo->rq != NULL)); 617703b705cfSriastradh} 617803b705cfSriastradh 617903b705cfSriastradhvoid kgem_scanout_flush(struct kgem *kgem, struct kgem_bo *bo) 618003b705cfSriastradh{ 618163ef14f0Smrg if (!bo->needs_flush && !bo->gtt_dirty) 618203b705cfSriastradh return; 618303b705cfSriastradh 61849a906b70Schristos kgem_bo_submit(kgem, bo); 61859a906b70Schristos 618603b705cfSriastradh /* If the kernel fails to emit the flush, then it will be forced when 618703b705cfSriastradh * we assume direct access. And as the usual failure is EIO, we do 618803b705cfSriastradh * not actually care. 618903b705cfSriastradh */ 619003b705cfSriastradh assert(bo->exec == NULL); 619103b705cfSriastradh if (bo->rq) 619203b705cfSriastradh __kgem_flush(kgem, bo); 619303b705cfSriastradh 619463ef14f0Smrg if (bo->scanout && kgem->needs_dirtyfb) { 619563ef14f0Smrg struct drm_mode_fb_dirty_cmd cmd; 619663ef14f0Smrg memset(&cmd, 0, sizeof(cmd)); 619763ef14f0Smrg cmd.fb_id = bo->delta; 619863ef14f0Smrg (void)drmIoctl(kgem->fd, DRM_IOCTL_MODE_DIRTYFB, &cmd); 619963ef14f0Smrg } 620063ef14f0Smrg 620103b705cfSriastradh /* Whatever actually happens, we can regard the GTT write domain 620203b705cfSriastradh * as being flushed. 
620303b705cfSriastradh */ 620463ef14f0Smrg __kgem_bo_clear_dirty(bo); 620503b705cfSriastradh} 620603b705cfSriastradh 62079a906b70Schristosinline static bool nearly_idle(struct kgem *kgem) 62089a906b70Schristos{ 62099a906b70Schristos int ring = kgem->ring == KGEM_BLT; 62109a906b70Schristos 621163ef14f0Smrg assert(ring < ARRAY_SIZE(kgem->requests)); 62129a906b70Schristos if (list_is_singular(&kgem->requests[ring])) 62139a906b70Schristos return true; 62149a906b70Schristos 62159a906b70Schristos return __kgem_ring_is_idle(kgem, ring); 62169a906b70Schristos} 62179a906b70Schristos 621803b705cfSriastradhinline static bool needs_semaphore(struct kgem *kgem, struct kgem_bo *bo) 621903b705cfSriastradh{ 62209a906b70Schristos if (kgem->needs_semaphore) 62219a906b70Schristos return false; 62229a906b70Schristos 62239a906b70Schristos if (bo->rq == NULL || RQ_RING(bo->rq) == kgem->ring) 62249a906b70Schristos return false; 62259a906b70Schristos 62269a906b70Schristos kgem->needs_semaphore = true; 62279a906b70Schristos return true; 62289a906b70Schristos} 62299a906b70Schristos 62309a906b70Schristosinline static bool needs_reservation(struct kgem *kgem, struct kgem_bo *bo) 62319a906b70Schristos{ 62329a906b70Schristos if (kgem->needs_reservation) 62339a906b70Schristos return false; 62349a906b70Schristos 62359a906b70Schristos if (bo->presumed_offset) 62369a906b70Schristos return false; 62379a906b70Schristos 62389a906b70Schristos kgem->needs_reservation = true; 62399a906b70Schristos return nearly_idle(kgem); 62409a906b70Schristos} 62419a906b70Schristos 62429a906b70Schristosinline static bool needs_batch_flush(struct kgem *kgem, struct kgem_bo *bo) 62439a906b70Schristos{ 62449a906b70Schristos bool flush = false; 62459a906b70Schristos 62469a906b70Schristos if (needs_semaphore(kgem, bo)) { 62479a906b70Schristos DBG(("%s: flushing before handle=%d for required semaphore\n", __FUNCTION__, bo->handle)); 62489a906b70Schristos flush = true; 62499a906b70Schristos } 62509a906b70Schristos 
62519a906b70Schristos if (needs_reservation(kgem, bo)) { 62529a906b70Schristos DBG(("%s: flushing before handle=%d for new reservation\n", __FUNCTION__, bo->handle)); 62539a906b70Schristos flush = true; 62549a906b70Schristos } 62559a906b70Schristos 62569a906b70Schristos return kgem->nreloc ? flush : false; 62579a906b70Schristos} 62589a906b70Schristos 62599a906b70Schristosstatic bool aperture_check(struct kgem *kgem, unsigned num_pages) 62609a906b70Schristos{ 62619a906b70Schristos struct drm_i915_gem_get_aperture aperture; 62629a906b70Schristos int reserve; 62639a906b70Schristos 62649a906b70Schristos if (kgem->aperture) 62659a906b70Schristos return false; 62669a906b70Schristos 62679a906b70Schristos /* Leave some space in case of alignment issues */ 62689a906b70Schristos reserve = kgem->aperture_mappable / 2; 62699a906b70Schristos if (kgem->gen < 033 && reserve < kgem->aperture_max_fence) 62709a906b70Schristos reserve = kgem->aperture_max_fence; 62719a906b70Schristos if (!kgem->has_llc) 62729a906b70Schristos reserve += kgem->nexec * PAGE_SIZE * 2; 62739a906b70Schristos 62749a906b70Schristos DBG(("%s: num_pages=%d, holding %d pages in reserve, total aperture %d\n", 62759a906b70Schristos __FUNCTION__, num_pages, reserve, kgem->aperture_total)); 62769a906b70Schristos num_pages += reserve; 62779a906b70Schristos 62789a906b70Schristos VG_CLEAR(aperture); 62799a906b70Schristos aperture.aper_available_size = kgem->aperture_total; 62809a906b70Schristos aperture.aper_available_size *= PAGE_SIZE; 62819a906b70Schristos (void)do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_GET_APERTURE, &aperture); 62829a906b70Schristos 62839a906b70Schristos DBG(("%s: aperture required %ld bytes, available %ld bytes\n", 62849a906b70Schristos __FUNCTION__, 62859a906b70Schristos (long)num_pages * PAGE_SIZE, 62869a906b70Schristos (long)aperture.aper_available_size)); 62879a906b70Schristos 62889a906b70Schristos return num_pages <= aperture.aper_available_size / PAGE_SIZE; 62899a906b70Schristos} 
62909a906b70Schristos 62919a906b70Schristosstatic inline bool kgem_flush(struct kgem *kgem, bool flush) 62929a906b70Schristos{ 62939a906b70Schristos if (unlikely(kgem->wedged)) 62949a906b70Schristos return false; 62959a906b70Schristos 62969a906b70Schristos if (kgem->nreloc == 0) 62979a906b70Schristos return true; 62989a906b70Schristos 629963ef14f0Smrg if (__to_sna(kgem)->flags & SNA_POWERSAVE) 63009a906b70Schristos return true; 63019a906b70Schristos 63029a906b70Schristos if (kgem->flush == flush && kgem->aperture < kgem->aperture_low) 63039a906b70Schristos return true; 63049a906b70Schristos 63059a906b70Schristos DBG(("%s: opportunistic flushing? flush=%d,%d, aperture=%d/%d, idle?=%d\n", 63069a906b70Schristos __FUNCTION__, kgem->flush, flush, kgem->aperture, kgem->aperture_low, kgem_ring_is_idle(kgem, kgem->ring))); 63079a906b70Schristos return !kgem_ring_is_idle(kgem, kgem->ring); 630803b705cfSriastradh} 630903b705cfSriastradh 631003b705cfSriastradhbool kgem_check_bo(struct kgem *kgem, ...) 
631103b705cfSriastradh{ 631203b705cfSriastradh va_list ap; 631303b705cfSriastradh struct kgem_bo *bo; 631403b705cfSriastradh int num_exec = 0; 631503b705cfSriastradh int num_pages = 0; 631603b705cfSriastradh bool flush = false; 63179a906b70Schristos bool busy = true; 631803b705cfSriastradh 631903b705cfSriastradh va_start(ap, kgem); 632003b705cfSriastradh while ((bo = va_arg(ap, struct kgem_bo *))) { 632103b705cfSriastradh while (bo->proxy) 632203b705cfSriastradh bo = bo->proxy; 632303b705cfSriastradh if (bo->exec) 632403b705cfSriastradh continue; 632503b705cfSriastradh 63269a906b70Schristos if (needs_batch_flush(kgem, bo)) { 63279a906b70Schristos va_end(ap); 632803b705cfSriastradh return false; 63299a906b70Schristos } 633003b705cfSriastradh 633103b705cfSriastradh num_pages += num_pages(bo); 633203b705cfSriastradh num_exec++; 633303b705cfSriastradh 633403b705cfSriastradh flush |= bo->flush; 63359a906b70Schristos busy &= bo->rq != NULL; 633603b705cfSriastradh } 633703b705cfSriastradh va_end(ap); 633803b705cfSriastradh 633903b705cfSriastradh DBG(("%s: num_pages=+%d, num_exec=+%d\n", 634003b705cfSriastradh __FUNCTION__, num_pages, num_exec)); 634103b705cfSriastradh 634203b705cfSriastradh if (!num_pages) 634303b705cfSriastradh return true; 634403b705cfSriastradh 63459a906b70Schristos if (kgem->nexec + num_exec >= KGEM_EXEC_SIZE(kgem)) { 63469a906b70Schristos DBG(("%s: out of exec slots (%d + %d / %d)\n", __FUNCTION__, 63479a906b70Schristos kgem->nexec, num_exec, KGEM_EXEC_SIZE(kgem))); 634803b705cfSriastradh return false; 634903b705cfSriastradh } 635003b705cfSriastradh 635103b705cfSriastradh if (num_pages + kgem->aperture > kgem->aperture_high) { 63529a906b70Schristos DBG(("%s: final aperture usage (%d + %d) is greater than high water mark (%d)\n", 63539a906b70Schristos __FUNCTION__, kgem->aperture, num_pages, kgem->aperture_high)); 63549a906b70Schristos return aperture_check(kgem, num_pages); 635503b705cfSriastradh } 635603b705cfSriastradh 63579a906b70Schristos if 
(busy) 63589a906b70Schristos return true; 635903b705cfSriastradh 63609a906b70Schristos return kgem_flush(kgem, flush); 636103b705cfSriastradh} 636203b705cfSriastradh 636303b705cfSriastradhbool kgem_check_bo_fenced(struct kgem *kgem, struct kgem_bo *bo) 636403b705cfSriastradh{ 636503b705cfSriastradh assert(bo->refcnt); 636603b705cfSriastradh while (bo->proxy) 636703b705cfSriastradh bo = bo->proxy; 636803b705cfSriastradh assert(bo->refcnt); 636903b705cfSriastradh 637003b705cfSriastradh if (bo->exec) { 637103b705cfSriastradh if (kgem->gen < 040 && 637203b705cfSriastradh bo->tiling != I915_TILING_NONE && 637303b705cfSriastradh (bo->exec->flags & EXEC_OBJECT_NEEDS_FENCE) == 0) { 63749a906b70Schristos uint32_t size; 63759a906b70Schristos 63769a906b70Schristos assert(bo->tiling == I915_TILING_X); 63779a906b70Schristos 637803b705cfSriastradh if (kgem->nfence >= kgem->fence_max) 637903b705cfSriastradh return false; 638003b705cfSriastradh 63819a906b70Schristos if (kgem->aperture_fenced) { 63829a906b70Schristos size = 3*kgem->aperture_fenced; 63839a906b70Schristos if (kgem->aperture_total == kgem->aperture_mappable) 63849a906b70Schristos size += kgem->aperture; 63859a906b70Schristos if (size > kgem->aperture_fenceable && 63869a906b70Schristos kgem_ring_is_idle(kgem, kgem->ring)) { 63879a906b70Schristos DBG(("%s: opportunistic fence flush\n", __FUNCTION__)); 63889a906b70Schristos return false; 63899a906b70Schristos } 63909a906b70Schristos } 639103b705cfSriastradh 63929a906b70Schristos size = kgem_bo_fenced_size(kgem, bo); 63939a906b70Schristos if (size > kgem->aperture_max_fence) 63949a906b70Schristos kgem->aperture_max_fence = size; 63959a906b70Schristos size += kgem->aperture_fenced; 63969a906b70Schristos if (kgem->gen < 033 && size < 2 * kgem->aperture_max_fence) 63979a906b70Schristos size = 2 * kgem->aperture_max_fence; 63989a906b70Schristos if (kgem->aperture_total == kgem->aperture_mappable) 63999a906b70Schristos size += kgem->aperture; 64009a906b70Schristos if (size > 
kgem->aperture_fenceable) { 64019a906b70Schristos DBG(("%s: estimated fence space required %d (fenced=%d, max_fence=%d, aperture=%d) exceeds fenceable aperture %d\n", 64029a906b70Schristos __FUNCTION__, size, kgem->aperture_fenced, kgem->aperture_max_fence, kgem->aperture, kgem->aperture_fenceable)); 640303b705cfSriastradh return false; 64049a906b70Schristos } 640503b705cfSriastradh } 640603b705cfSriastradh 640703b705cfSriastradh return true; 640803b705cfSriastradh } 640903b705cfSriastradh 641003b705cfSriastradh if (kgem->nexec >= KGEM_EXEC_SIZE(kgem) - 1) 641103b705cfSriastradh return false; 641203b705cfSriastradh 64139a906b70Schristos if (needs_batch_flush(kgem, bo)) 641403b705cfSriastradh return false; 641503b705cfSriastradh 641603b705cfSriastradh assert_tiling(kgem, bo); 641703b705cfSriastradh if (kgem->gen < 040 && bo->tiling != I915_TILING_NONE) { 64189a906b70Schristos uint32_t size; 64199a906b70Schristos 64209a906b70Schristos assert(bo->tiling == I915_TILING_X); 64219a906b70Schristos 642203b705cfSriastradh if (kgem->nfence >= kgem->fence_max) 642303b705cfSriastradh return false; 642403b705cfSriastradh 64259a906b70Schristos if (kgem->aperture_fenced) { 64269a906b70Schristos size = 3*kgem->aperture_fenced; 64279a906b70Schristos if (kgem->aperture_total == kgem->aperture_mappable) 64289a906b70Schristos size += kgem->aperture; 64299a906b70Schristos if (size > kgem->aperture_fenceable && 64309a906b70Schristos kgem_ring_is_idle(kgem, kgem->ring)) { 64319a906b70Schristos DBG(("%s: opportunistic fence flush\n", __FUNCTION__)); 64329a906b70Schristos return false; 64339a906b70Schristos } 64349a906b70Schristos } 643503b705cfSriastradh 64369a906b70Schristos size = kgem_bo_fenced_size(kgem, bo); 64379a906b70Schristos if (size > kgem->aperture_max_fence) 64389a906b70Schristos kgem->aperture_max_fence = size; 64399a906b70Schristos size += kgem->aperture_fenced; 64409a906b70Schristos if (kgem->gen < 033 && size < 2 * kgem->aperture_max_fence) 64419a906b70Schristos size = 2 
* kgem->aperture_max_fence; 64429a906b70Schristos if (kgem->aperture_total == kgem->aperture_mappable) 64439a906b70Schristos size += kgem->aperture; 64449a906b70Schristos if (size > kgem->aperture_fenceable) { 64459a906b70Schristos DBG(("%s: estimated fence space required %d (fenced=%d, max_fence=%d, aperture=%d) exceeds fenceable aperture %d\n", 64469a906b70Schristos __FUNCTION__, size, kgem->aperture_fenced, kgem->aperture_max_fence, kgem->aperture, kgem->aperture_fenceable)); 644703b705cfSriastradh return false; 64489a906b70Schristos } 644903b705cfSriastradh } 645003b705cfSriastradh 64519a906b70Schristos if (kgem->aperture + kgem->aperture_fenced + num_pages(bo) > kgem->aperture_high) { 64529a906b70Schristos DBG(("%s: final aperture usage (%d + %d) is greater than high water mark (%d)\n", 64539a906b70Schristos __FUNCTION__, kgem->aperture, num_pages(bo), kgem->aperture_high)); 64549a906b70Schristos return aperture_check(kgem, num_pages(bo)); 64559a906b70Schristos } 64569a906b70Schristos 64579a906b70Schristos if (bo->rq) 64589a906b70Schristos return true; 64599a906b70Schristos 64609a906b70Schristos return kgem_flush(kgem, bo->flush); 646103b705cfSriastradh} 646203b705cfSriastradh 646303b705cfSriastradhbool kgem_check_many_bo_fenced(struct kgem *kgem, ...) 
646403b705cfSriastradh{ 646503b705cfSriastradh va_list ap; 646603b705cfSriastradh struct kgem_bo *bo; 646703b705cfSriastradh int num_fence = 0; 646803b705cfSriastradh int num_exec = 0; 646903b705cfSriastradh int num_pages = 0; 647003b705cfSriastradh int fenced_size = 0; 647103b705cfSriastradh bool flush = false; 64729a906b70Schristos bool busy = true; 647303b705cfSriastradh 647403b705cfSriastradh va_start(ap, kgem); 647503b705cfSriastradh while ((bo = va_arg(ap, struct kgem_bo *))) { 647603b705cfSriastradh assert(bo->refcnt); 647703b705cfSriastradh while (bo->proxy) 647803b705cfSriastradh bo = bo->proxy; 647903b705cfSriastradh assert(bo->refcnt); 648003b705cfSriastradh if (bo->exec) { 648103b705cfSriastradh if (kgem->gen >= 040 || bo->tiling == I915_TILING_NONE) 648203b705cfSriastradh continue; 648303b705cfSriastradh 648403b705cfSriastradh if ((bo->exec->flags & EXEC_OBJECT_NEEDS_FENCE) == 0) { 648503b705cfSriastradh fenced_size += kgem_bo_fenced_size(kgem, bo); 648603b705cfSriastradh num_fence++; 648703b705cfSriastradh } 648803b705cfSriastradh 648903b705cfSriastradh continue; 649003b705cfSriastradh } 649103b705cfSriastradh 64929a906b70Schristos if (needs_batch_flush(kgem, bo)) { 64939a906b70Schristos va_end(ap); 649403b705cfSriastradh return false; 64959a906b70Schristos } 649603b705cfSriastradh 649703b705cfSriastradh assert_tiling(kgem, bo); 649803b705cfSriastradh num_pages += num_pages(bo); 649903b705cfSriastradh num_exec++; 650003b705cfSriastradh if (kgem->gen < 040 && bo->tiling) { 65019a906b70Schristos uint32_t size = kgem_bo_fenced_size(kgem, bo); 65029a906b70Schristos if (size > kgem->aperture_max_fence) 65039a906b70Schristos kgem->aperture_max_fence = size; 65049a906b70Schristos fenced_size += size; 650503b705cfSriastradh num_fence++; 650603b705cfSriastradh } 650703b705cfSriastradh 650803b705cfSriastradh flush |= bo->flush; 65099a906b70Schristos busy &= bo->rq != NULL; 651003b705cfSriastradh } 651103b705cfSriastradh va_end(ap); 651203b705cfSriastradh 
651303b705cfSriastradh if (num_fence) { 65149a906b70Schristos uint32_t size; 65159a906b70Schristos 651603b705cfSriastradh if (kgem->nfence + num_fence > kgem->fence_max) 651703b705cfSriastradh return false; 651803b705cfSriastradh 65199a906b70Schristos if (kgem->aperture_fenced) { 65209a906b70Schristos size = 3*kgem->aperture_fenced; 65219a906b70Schristos if (kgem->aperture_total == kgem->aperture_mappable) 65229a906b70Schristos size += kgem->aperture; 65239a906b70Schristos if (size > kgem->aperture_fenceable && 65249a906b70Schristos kgem_ring_is_idle(kgem, kgem->ring)) { 65259a906b70Schristos DBG(("%s: opportunistic fence flush\n", __FUNCTION__)); 65269a906b70Schristos return false; 65279a906b70Schristos } 65289a906b70Schristos } 652903b705cfSriastradh 65309a906b70Schristos size = kgem->aperture_fenced; 65319a906b70Schristos size += fenced_size; 65329a906b70Schristos if (kgem->gen < 033 && size < 2 * kgem->aperture_max_fence) 65339a906b70Schristos size = 2 * kgem->aperture_max_fence; 65349a906b70Schristos if (kgem->aperture_total == kgem->aperture_mappable) 65359a906b70Schristos size += kgem->aperture; 65369a906b70Schristos if (size > kgem->aperture_fenceable) { 65379a906b70Schristos DBG(("%s: estimated fence space required %d (fenced=%d, max_fence=%d, aperture=%d) exceeds fenceable aperture %d\n", 65389a906b70Schristos __FUNCTION__, size, kgem->aperture_fenced, kgem->aperture_max_fence, kgem->aperture, kgem->aperture_fenceable)); 653903b705cfSriastradh return false; 65409a906b70Schristos } 654103b705cfSriastradh } 654203b705cfSriastradh 65439a906b70Schristos if (num_pages == 0) 65449a906b70Schristos return true; 654503b705cfSriastradh 65469a906b70Schristos if (kgem->nexec + num_exec >= KGEM_EXEC_SIZE(kgem)) 65479a906b70Schristos return false; 654803b705cfSriastradh 65499a906b70Schristos if (num_pages + kgem->aperture > kgem->aperture_high - kgem->aperture_fenced) { 65509a906b70Schristos DBG(("%s: final aperture usage (%d + %d + %d) is greater than high water mark 
(%d)\n", 65519a906b70Schristos __FUNCTION__, kgem->aperture, kgem->aperture_fenced, num_pages, kgem->aperture_high)); 65529a906b70Schristos return aperture_check(kgem, num_pages); 655303b705cfSriastradh } 655403b705cfSriastradh 65559a906b70Schristos if (busy) 65569a906b70Schristos return true; 65579a906b70Schristos 65589a906b70Schristos return kgem_flush(kgem, flush); 655903b705cfSriastradh} 656003b705cfSriastradh 656163ef14f0Smrgvoid __kgem_bcs_set_tiling(struct kgem *kgem, 656263ef14f0Smrg struct kgem_bo *src, 656363ef14f0Smrg struct kgem_bo *dst) 656463ef14f0Smrg{ 656563ef14f0Smrg uint32_t state, *b; 656663ef14f0Smrg 656763ef14f0Smrg DBG(("%s: src handle=%d:tiling=%d, dst handle=%d:tiling=%d\n", 656863ef14f0Smrg __FUNCTION__, 656963ef14f0Smrg src ? src->handle : 0, src ? src->tiling : 0, 657063ef14f0Smrg dst ? dst->handle : 0, dst ? dst->tiling : 0)); 657163ef14f0Smrg assert(kgem->mode == KGEM_BLT); 657263ef14f0Smrg assert(dst == NULL || kgem_bo_can_blt(kgem, dst)); 657363ef14f0Smrg assert(src == NULL || kgem_bo_can_blt(kgem, src)); 657463ef14f0Smrg 657563ef14f0Smrg state = 0; 657663ef14f0Smrg if (dst && dst->tiling == I915_TILING_Y) 657763ef14f0Smrg state |= BCS_DST_Y; 657863ef14f0Smrg if (src && src->tiling == I915_TILING_Y) 657963ef14f0Smrg state |= BCS_SRC_Y; 658063ef14f0Smrg 658163ef14f0Smrg if (kgem->bcs_state == state) 658263ef14f0Smrg return; 658363ef14f0Smrg 658463ef14f0Smrg DBG(("%s: updating SWCTRL %x -> %x\n", __FUNCTION__, 658563ef14f0Smrg kgem->bcs_state, state)); 658663ef14f0Smrg 658763ef14f0Smrg /* Over-estimate space in case we need to re-emit the cmd packet */ 658863ef14f0Smrg if (!kgem_check_batch(kgem, 24)) { 658963ef14f0Smrg _kgem_submit(kgem); 659063ef14f0Smrg _kgem_set_mode(kgem, KGEM_BLT); 659163ef14f0Smrg if (state == 0) 659263ef14f0Smrg return; 659363ef14f0Smrg } 659463ef14f0Smrg 659563ef14f0Smrg b = kgem->batch + kgem->nbatch; 659663ef14f0Smrg if (kgem->nbatch) { 659763ef14f0Smrg *b++ = MI_FLUSH_DW; 659863ef14f0Smrg *b++ = 0; 
659963ef14f0Smrg *b++ = 0; 660063ef14f0Smrg *b++ = 0; 660163ef14f0Smrg } 660263ef14f0Smrg *b++ = MI_LOAD_REGISTER_IMM; 660363ef14f0Smrg *b++ = BCS_SWCTRL; 660463ef14f0Smrg *b++ = (BCS_SRC_Y | BCS_DST_Y) << 16 | state; 660563ef14f0Smrg kgem->nbatch = b - kgem->batch; 660663ef14f0Smrg 660763ef14f0Smrg kgem->bcs_state = state; 660863ef14f0Smrg} 660963ef14f0Smrg 661003b705cfSriastradhuint32_t kgem_add_reloc(struct kgem *kgem, 661103b705cfSriastradh uint32_t pos, 661203b705cfSriastradh struct kgem_bo *bo, 661303b705cfSriastradh uint32_t read_write_domain, 661403b705cfSriastradh uint32_t delta) 661503b705cfSriastradh{ 661603b705cfSriastradh int index; 661703b705cfSriastradh 661803b705cfSriastradh DBG(("%s: handle=%d, pos=%d, delta=%d, domains=%08x\n", 661903b705cfSriastradh __FUNCTION__, bo ? bo->handle : 0, pos, delta, read_write_domain)); 662003b705cfSriastradh 66219a906b70Schristos assert(kgem->gen < 0100); 662203b705cfSriastradh assert((read_write_domain & 0x7fff) == 0 || bo != NULL); 662303b705cfSriastradh 662403b705cfSriastradh index = kgem->nreloc++; 662503b705cfSriastradh assert(index < ARRAY_SIZE(kgem->reloc)); 662603b705cfSriastradh kgem->reloc[index].offset = pos * sizeof(kgem->batch[0]); 662703b705cfSriastradh if (bo) { 66289a906b70Schristos assert(kgem->mode != KGEM_NONE); 662903b705cfSriastradh assert(bo->refcnt); 663003b705cfSriastradh while (bo->proxy) { 663103b705cfSriastradh DBG(("%s: adding proxy [delta=%d] for handle=%d\n", 663203b705cfSriastradh __FUNCTION__, bo->delta, bo->handle)); 663303b705cfSriastradh delta += bo->delta; 663403b705cfSriastradh assert(bo->handle == bo->proxy->handle); 663503b705cfSriastradh /* need to release the cache upon batch submit */ 663603b705cfSriastradh if (bo->exec == NULL) { 663703b705cfSriastradh list_move_tail(&bo->request, 663803b705cfSriastradh &kgem->next_request->buffers); 663903b705cfSriastradh bo->rq = MAKE_REQUEST(kgem->next_request, 664003b705cfSriastradh kgem->ring); 664103b705cfSriastradh bo->exec = 
&_kgem_dummy_exec; 66429a906b70Schristos bo->domain = DOMAIN_GPU; 664303b705cfSriastradh } 664403b705cfSriastradh 664503b705cfSriastradh if (read_write_domain & 0x7fff && !bo->gpu_dirty) 664603b705cfSriastradh __kgem_bo_mark_dirty(bo); 664703b705cfSriastradh 664803b705cfSriastradh bo = bo->proxy; 664903b705cfSriastradh assert(bo->refcnt); 665003b705cfSriastradh } 665103b705cfSriastradh assert(bo->refcnt); 665203b705cfSriastradh 665303b705cfSriastradh if (bo->exec == NULL) 665403b705cfSriastradh kgem_add_bo(kgem, bo); 665503b705cfSriastradh assert(bo->rq == MAKE_REQUEST(kgem->next_request, kgem->ring)); 665603b705cfSriastradh assert(RQ_RING(bo->rq) == kgem->ring); 665703b705cfSriastradh 665803b705cfSriastradh if (kgem->gen < 040 && read_write_domain & KGEM_RELOC_FENCED) { 665903b705cfSriastradh if (bo->tiling && 666003b705cfSriastradh (bo->exec->flags & EXEC_OBJECT_NEEDS_FENCE) == 0) { 66619a906b70Schristos assert(bo->tiling == I915_TILING_X); 666203b705cfSriastradh assert(kgem->nfence < kgem->fence_max); 666303b705cfSriastradh kgem->aperture_fenced += 666403b705cfSriastradh kgem_bo_fenced_size(kgem, bo); 666503b705cfSriastradh kgem->nfence++; 666603b705cfSriastradh } 666703b705cfSriastradh bo->exec->flags |= EXEC_OBJECT_NEEDS_FENCE; 666803b705cfSriastradh } 666903b705cfSriastradh 667003b705cfSriastradh kgem->reloc[index].delta = delta; 667103b705cfSriastradh kgem->reloc[index].target_handle = bo->target_handle; 667203b705cfSriastradh kgem->reloc[index].presumed_offset = bo->presumed_offset; 667303b705cfSriastradh 667403b705cfSriastradh if (read_write_domain & 0x7fff && !bo->gpu_dirty) { 667503b705cfSriastradh assert(!bo->snoop || kgem->can_blt_cpu); 667603b705cfSriastradh __kgem_bo_mark_dirty(bo); 667703b705cfSriastradh } 667803b705cfSriastradh 667903b705cfSriastradh delta += bo->presumed_offset; 668003b705cfSriastradh } else { 668103b705cfSriastradh kgem->reloc[index].delta = delta; 668203b705cfSriastradh kgem->reloc[index].target_handle = ~0U; 
668303b705cfSriastradh kgem->reloc[index].presumed_offset = 0; 668403b705cfSriastradh if (kgem->nreloc__self < 256) 668503b705cfSriastradh kgem->reloc__self[kgem->nreloc__self++] = index; 668603b705cfSriastradh } 668703b705cfSriastradh kgem->reloc[index].read_domains = read_write_domain >> 16; 668803b705cfSriastradh kgem->reloc[index].write_domain = read_write_domain & 0x7fff; 668903b705cfSriastradh 669003b705cfSriastradh return delta; 669103b705cfSriastradh} 669203b705cfSriastradh 66939a906b70Schristosuint64_t kgem_add_reloc64(struct kgem *kgem, 66949a906b70Schristos uint32_t pos, 66959a906b70Schristos struct kgem_bo *bo, 66969a906b70Schristos uint32_t read_write_domain, 66979a906b70Schristos uint64_t delta) 66989a906b70Schristos{ 66999a906b70Schristos int index; 67009a906b70Schristos 67019a906b70Schristos DBG(("%s: handle=%d, pos=%d, delta=%ld, domains=%08x\n", 67029a906b70Schristos __FUNCTION__, bo ? bo->handle : 0, pos, (long)delta, read_write_domain)); 67039a906b70Schristos 67049a906b70Schristos assert(kgem->gen >= 0100); 67059a906b70Schristos assert((read_write_domain & 0x7fff) == 0 || bo != NULL); 67069a906b70Schristos 67079a906b70Schristos index = kgem->nreloc++; 67089a906b70Schristos assert(index < ARRAY_SIZE(kgem->reloc)); 67099a906b70Schristos kgem->reloc[index].offset = pos * sizeof(kgem->batch[0]); 67109a906b70Schristos if (bo) { 67119a906b70Schristos assert(kgem->mode != KGEM_NONE); 67129a906b70Schristos assert(bo->refcnt); 67139a906b70Schristos while (bo->proxy) { 67149a906b70Schristos DBG(("%s: adding proxy [delta=%ld] for handle=%d\n", 67159a906b70Schristos __FUNCTION__, (long)bo->delta, bo->handle)); 67169a906b70Schristos delta += bo->delta; 67179a906b70Schristos assert(bo->handle == bo->proxy->handle); 67189a906b70Schristos /* need to release the cache upon batch submit */ 67199a906b70Schristos if (bo->exec == NULL) { 67209a906b70Schristos list_move_tail(&bo->request, 67219a906b70Schristos &kgem->next_request->buffers); 67229a906b70Schristos 
bo->rq = MAKE_REQUEST(kgem->next_request, 67239a906b70Schristos kgem->ring); 67249a906b70Schristos bo->exec = &_kgem_dummy_exec; 67259a906b70Schristos bo->domain = DOMAIN_GPU; 67269a906b70Schristos } 67279a906b70Schristos 67289a906b70Schristos if (read_write_domain & 0x7fff && !bo->gpu_dirty) 67299a906b70Schristos __kgem_bo_mark_dirty(bo); 67309a906b70Schristos 67319a906b70Schristos bo = bo->proxy; 67329a906b70Schristos assert(bo->refcnt); 67339a906b70Schristos } 67349a906b70Schristos assert(bo->refcnt); 67359a906b70Schristos 67369a906b70Schristos if (bo->exec == NULL) 67379a906b70Schristos kgem_add_bo(kgem, bo); 67389a906b70Schristos assert(bo->rq == MAKE_REQUEST(kgem->next_request, kgem->ring)); 67399a906b70Schristos assert(RQ_RING(bo->rq) == kgem->ring); 67409a906b70Schristos 67419a906b70Schristos DBG(("%s[%d] = (delta=%d, target handle=%d, presumed=%llx)\n", 67429a906b70Schristos __FUNCTION__, index, delta, bo->target_handle, (long long)bo->presumed_offset)); 67439a906b70Schristos kgem->reloc[index].delta = delta; 67449a906b70Schristos kgem->reloc[index].target_handle = bo->target_handle; 67459a906b70Schristos kgem->reloc[index].presumed_offset = bo->presumed_offset; 67469a906b70Schristos 67479a906b70Schristos if (read_write_domain & 0x7fff && !bo->gpu_dirty) { 67489a906b70Schristos assert(!bo->snoop || kgem->can_blt_cpu); 67499a906b70Schristos __kgem_bo_mark_dirty(bo); 67509a906b70Schristos } 67519a906b70Schristos 67529a906b70Schristos delta += bo->presumed_offset; 67539a906b70Schristos } else { 67549a906b70Schristos DBG(("%s[%d] = (delta=%d, target handle=batch)\n", 67559a906b70Schristos __FUNCTION__, index, delta)); 67569a906b70Schristos kgem->reloc[index].delta = delta; 67579a906b70Schristos kgem->reloc[index].target_handle = ~0U; 67589a906b70Schristos kgem->reloc[index].presumed_offset = 0; 67599a906b70Schristos if (kgem->nreloc__self < 256) 67609a906b70Schristos kgem->reloc__self[kgem->nreloc__self++] = index; 67619a906b70Schristos } 67629a906b70Schristos 
kgem->reloc[index].read_domains = read_write_domain >> 16; 67639a906b70Schristos kgem->reloc[index].write_domain = read_write_domain & 0x7fff; 67649a906b70Schristos 67659a906b70Schristos return delta; 67669a906b70Schristos} 67679a906b70Schristos 676803b705cfSriastradhstatic void kgem_trim_vma_cache(struct kgem *kgem, int type, int bucket) 676903b705cfSriastradh{ 677003b705cfSriastradh int i, j; 677103b705cfSriastradh 677203b705cfSriastradh DBG(("%s: type=%d, count=%d (bucket: %d)\n", 677303b705cfSriastradh __FUNCTION__, type, kgem->vma[type].count, bucket)); 677403b705cfSriastradh if (kgem->vma[type].count <= 0) 677503b705cfSriastradh return; 677603b705cfSriastradh 677703b705cfSriastradh if (kgem->need_purge) 677803b705cfSriastradh kgem_purge_cache(kgem); 677903b705cfSriastradh 678003b705cfSriastradh /* vma are limited on a per-process basis to around 64k. 678103b705cfSriastradh * This includes all malloc arenas as well as other file 678203b705cfSriastradh * mappings. In order to be fair and not hog the cache, 678303b705cfSriastradh * and more importantly not to exhaust that limit and to 678403b705cfSriastradh * start failing mappings, we keep our own number of open 678503b705cfSriastradh * vma to within a conservative value. 
678603b705cfSriastradh */ 678703b705cfSriastradh i = 0; 678803b705cfSriastradh while (kgem->vma[type].count > 0) { 678903b705cfSriastradh struct kgem_bo *bo = NULL; 679003b705cfSriastradh 679103b705cfSriastradh for (j = 0; 679203b705cfSriastradh bo == NULL && j < ARRAY_SIZE(kgem->vma[type].inactive); 679303b705cfSriastradh j++) { 679403b705cfSriastradh struct list *head = &kgem->vma[type].inactive[i++%ARRAY_SIZE(kgem->vma[type].inactive)]; 679503b705cfSriastradh if (!list_is_empty(head)) 679603b705cfSriastradh bo = list_last_entry(head, struct kgem_bo, vma); 679703b705cfSriastradh } 679803b705cfSriastradh if (bo == NULL) 679903b705cfSriastradh break; 680003b705cfSriastradh 680103b705cfSriastradh DBG(("%s: discarding inactive %s vma cache for %d\n", 68029a906b70Schristos __FUNCTION__, type ? "CPU" : "GTT", bo->handle)); 68039a906b70Schristos 680403b705cfSriastradh assert(bo->rq == NULL); 6805813957e3Ssnj if (type) { 6806813957e3Ssnj VG(VALGRIND_MAKE_MEM_NOACCESS(MAP(bo->map__cpu), bytes(bo))); 6807813957e3Ssnj munmap(MAP(bo->map__cpu), bytes(bo)); 6808813957e3Ssnj bo->map__cpu = NULL; 6809813957e3Ssnj } else { 6810813957e3Ssnj if (bo->map__wc) { 6811813957e3Ssnj VG(VALGRIND_MAKE_MEM_NOACCESS(bo->map__wc, bytes(bo))); 6812813957e3Ssnj munmap(bo->map__wc, bytes(bo)); 6813813957e3Ssnj bo->map__wc = NULL; 6814813957e3Ssnj } 6815813957e3Ssnj if (bo->map__gtt) { 6816813957e3Ssnj munmap(bo->map__gtt, bytes(bo)); 6817813957e3Ssnj bo->map__gtt = NULL; 6818813957e3Ssnj } 6819813957e3Ssnj } 682003b705cfSriastradh 682103b705cfSriastradh list_del(&bo->vma); 682203b705cfSriastradh kgem->vma[type].count--; 682303b705cfSriastradh } 682403b705cfSriastradh} 682503b705cfSriastradh 6826813957e3Ssnjstatic void *__kgem_bo_map__gtt_or_wc(struct kgem *kgem, struct kgem_bo *bo) 682703b705cfSriastradh{ 682803b705cfSriastradh void *ptr; 682903b705cfSriastradh 6830813957e3Ssnj DBG(("%s: handle=%d\n", __FUNCTION__, bo->handle)); 6831813957e3Ssnj 6832813957e3Ssnj assert(bo->proxy == NULL); 
6833813957e3Ssnj assert(!bo->snoop); 6834813957e3Ssnj 6835813957e3Ssnj kgem_trim_vma_cache(kgem, MAP_GTT, bucket(bo)); 6836813957e3Ssnj 6837813957e3Ssnj if (bo->tiling || !kgem->has_wc_mmap) { 6838813957e3Ssnj assert(kgem->gen != 021 || bo->tiling != I915_TILING_Y); 683963ef14f0Smrg warn_unless(num_pages(bo) <= kgem->aperture_mappable / 2); 6840813957e3Ssnj 6841813957e3Ssnj ptr = bo->map__gtt; 6842813957e3Ssnj if (ptr == NULL) 6843813957e3Ssnj ptr = __kgem_bo_map__gtt(kgem, bo); 6844813957e3Ssnj } else { 6845813957e3Ssnj ptr = bo->map__wc; 6846813957e3Ssnj if (ptr == NULL) 6847813957e3Ssnj ptr = __kgem_bo_map__wc(kgem, bo); 6848813957e3Ssnj } 6849813957e3Ssnj 6850813957e3Ssnj return ptr; 6851813957e3Ssnj} 6852813957e3Ssnj 6853813957e3Ssnjvoid *kgem_bo_map__async(struct kgem *kgem, struct kgem_bo *bo) 6854813957e3Ssnj{ 68559a906b70Schristos DBG(("%s: handle=%d, offset=%ld, tiling=%d, map=%p:%p, domain=%d\n", __FUNCTION__, 68569a906b70Schristos bo->handle, (long)bo->presumed_offset, bo->tiling, bo->map__gtt, bo->map__cpu, bo->domain)); 685703b705cfSriastradh 685803b705cfSriastradh assert(bo->proxy == NULL); 685903b705cfSriastradh assert(list_is_empty(&bo->list)); 686003b705cfSriastradh assert_tiling(kgem, bo); 68619a906b70Schristos assert(!bo->purged || bo->reusable); 686203b705cfSriastradh 686303b705cfSriastradh if (bo->tiling == I915_TILING_NONE && !bo->scanout && kgem->has_llc) { 686403b705cfSriastradh DBG(("%s: converting request for GTT map into CPU map\n", 686503b705cfSriastradh __FUNCTION__)); 686603b705cfSriastradh return kgem_bo_map__cpu(kgem, bo); 686703b705cfSriastradh } 686803b705cfSriastradh 6869813957e3Ssnj return __kgem_bo_map__gtt_or_wc(kgem, bo); 687003b705cfSriastradh} 687103b705cfSriastradh 687203b705cfSriastradhvoid *kgem_bo_map(struct kgem *kgem, struct kgem_bo *bo) 687303b705cfSriastradh{ 687403b705cfSriastradh void *ptr; 687503b705cfSriastradh 68769a906b70Schristos DBG(("%s: handle=%d, offset=%ld, tiling=%d, map=%p:%p, domain=%d\n", 
__FUNCTION__, 68779a906b70Schristos bo->handle, (long)bo->presumed_offset, bo->tiling, bo->map__gtt, bo->map__cpu, bo->domain)); 687803b705cfSriastradh 687903b705cfSriastradh assert(bo->proxy == NULL); 688003b705cfSriastradh assert(list_is_empty(&bo->list)); 688103b705cfSriastradh assert(bo->exec == NULL); 688203b705cfSriastradh assert_tiling(kgem, bo); 68839a906b70Schristos assert(!bo->purged || bo->reusable); 688403b705cfSriastradh 688503b705cfSriastradh if (bo->tiling == I915_TILING_NONE && !bo->scanout && 688603b705cfSriastradh (kgem->has_llc || bo->domain == DOMAIN_CPU)) { 688703b705cfSriastradh DBG(("%s: converting request for GTT map into CPU map\n", 688803b705cfSriastradh __FUNCTION__)); 688903b705cfSriastradh ptr = kgem_bo_map__cpu(kgem, bo); 689003b705cfSriastradh if (ptr) 689103b705cfSriastradh kgem_bo_sync__cpu(kgem, bo); 689203b705cfSriastradh return ptr; 689303b705cfSriastradh } 689403b705cfSriastradh 6895813957e3Ssnj ptr = __kgem_bo_map__gtt_or_wc(kgem, bo); 689603b705cfSriastradh 689703b705cfSriastradh if (bo->domain != DOMAIN_GTT || FORCE_MMAP_SYNC & (1 << DOMAIN_GTT)) { 689803b705cfSriastradh struct drm_i915_gem_set_domain set_domain; 689903b705cfSriastradh 690003b705cfSriastradh DBG(("%s: sync: needs_flush? %d, domain? %d, busy? %d\n", __FUNCTION__, 690103b705cfSriastradh bo->needs_flush, bo->domain, __kgem_busy(kgem, bo->handle))); 690203b705cfSriastradh 690303b705cfSriastradh /* XXX use PROT_READ to avoid the write flush? 
*/ 690403b705cfSriastradh 690503b705cfSriastradh VG_CLEAR(set_domain); 690603b705cfSriastradh set_domain.handle = bo->handle; 690703b705cfSriastradh set_domain.read_domains = I915_GEM_DOMAIN_GTT; 690803b705cfSriastradh set_domain.write_domain = I915_GEM_DOMAIN_GTT; 69099a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_DOMAIN, &set_domain)) { 69109a906b70Schristos DBG(("%s: sync: GPU hang detected\n", __FUNCTION__)); 69119a906b70Schristos kgem_throttle(kgem); 691203b705cfSriastradh } 691363ef14f0Smrg bo->needs_flush = false; 69149a906b70Schristos kgem_bo_retire(kgem, bo); 69159a906b70Schristos bo->domain = DOMAIN_GTT; 69169a906b70Schristos bo->gtt_dirty = true; 691703b705cfSriastradh } 691803b705cfSriastradh 691903b705cfSriastradh return ptr; 692003b705cfSriastradh} 692103b705cfSriastradh 692203b705cfSriastradhvoid *kgem_bo_map__gtt(struct kgem *kgem, struct kgem_bo *bo) 692303b705cfSriastradh{ 69249a906b70Schristos DBG(("%s: handle=%d, offset=%ld, tiling=%d, map=%p:%p, domain=%d\n", __FUNCTION__, 69259a906b70Schristos bo->handle, (long)bo->presumed_offset, bo->tiling, bo->map__gtt, bo->map__cpu, bo->domain)); 692603b705cfSriastradh 69279a906b70Schristos assert(bo->proxy == NULL); 692803b705cfSriastradh assert(bo->exec == NULL); 692903b705cfSriastradh assert(list_is_empty(&bo->list)); 693003b705cfSriastradh assert_tiling(kgem, bo); 69319a906b70Schristos assert(!bo->purged || bo->reusable); 693203b705cfSriastradh 6933813957e3Ssnj return __kgem_bo_map__gtt_or_wc(kgem, bo); 6934813957e3Ssnj} 693503b705cfSriastradh 6936813957e3Ssnjvoid *kgem_bo_map__wc(struct kgem *kgem, struct kgem_bo *bo) 6937813957e3Ssnj{ 6938813957e3Ssnj DBG(("%s: handle=%d, offset=%ld, tiling=%d, map=%p:%p, domain=%d\n", __FUNCTION__, 6939813957e3Ssnj bo->handle, (long)bo->presumed_offset, bo->tiling, bo->map__gtt, bo->map__cpu, bo->domain)); 694003b705cfSriastradh 6941813957e3Ssnj assert(bo->proxy == NULL); 6942813957e3Ssnj assert(list_is_empty(&bo->list)); 6943813957e3Ssnj 
assert_tiling(kgem, bo); 6944813957e3Ssnj assert(!bo->purged || bo->reusable); 694503b705cfSriastradh 6946813957e3Ssnj if (bo->map__wc) 6947813957e3Ssnj return bo->map__wc; 694863ef14f0Smrg if (!kgem->has_wc_mmap) 694963ef14f0Smrg return NULL; 695003b705cfSriastradh 695163ef14f0Smrg kgem_trim_vma_cache(kgem, MAP_GTT, bucket(bo)); 6952813957e3Ssnj return __kgem_bo_map__wc(kgem, bo); 695303b705cfSriastradh} 695403b705cfSriastradh 695503b705cfSriastradhvoid *kgem_bo_map__cpu(struct kgem *kgem, struct kgem_bo *bo) 695603b705cfSriastradh{ 69579a906b70Schristos DBG(("%s(handle=%d, size=%d, map=%p:%p)\n", 69589a906b70Schristos __FUNCTION__, bo->handle, bytes(bo), bo->map__gtt, bo->map__cpu)); 695903b705cfSriastradh assert(!bo->purged); 696003b705cfSriastradh assert(list_is_empty(&bo->list)); 696103b705cfSriastradh assert(bo->proxy == NULL); 69629a906b70Schristos assert_tiling(kgem, bo); 696303b705cfSriastradh 69649a906b70Schristos if (bo->map__cpu) 69659a906b70Schristos return MAP(bo->map__cpu); 696603b705cfSriastradh 696703b705cfSriastradh kgem_trim_vma_cache(kgem, MAP_CPU, bucket(bo)); 696803b705cfSriastradh 6969813957e3Ssnj return __kgem_bo_map__cpu(kgem, bo); 6970813957e3Ssnj} 697103b705cfSriastradh 6972813957e3Ssnjvoid *kgem_bo_map__debug(struct kgem *kgem, struct kgem_bo *bo) 6973813957e3Ssnj{ 6974813957e3Ssnj void *ptr; 697503b705cfSriastradh 6976813957e3Ssnj if (bo->tiling == I915_TILING_NONE && kgem->has_llc) { 6977813957e3Ssnj ptr = MAP(bo->map__cpu); 6978813957e3Ssnj if (ptr == NULL) 6979813957e3Ssnj ptr = __kgem_bo_map__cpu(kgem, bo); 6980813957e3Ssnj } else if (bo->tiling || !kgem->has_wc_mmap) { 6981813957e3Ssnj ptr = bo->map__gtt; 6982813957e3Ssnj if (ptr == NULL) 6983813957e3Ssnj ptr = __kgem_bo_map__gtt(kgem, bo); 6984813957e3Ssnj } else { 6985813957e3Ssnj ptr = bo->map__wc; 6986813957e3Ssnj if (ptr == NULL) 6987813957e3Ssnj ptr = __kgem_bo_map__wc(kgem, bo); 698803b705cfSriastradh } 698903b705cfSriastradh 6990813957e3Ssnj return ptr; 
699103b705cfSriastradh} 699203b705cfSriastradh 6993813957e3Ssnj 699403b705cfSriastradhuint32_t kgem_bo_flink(struct kgem *kgem, struct kgem_bo *bo) 699503b705cfSriastradh{ 699603b705cfSriastradh struct drm_gem_flink flink; 699703b705cfSriastradh 699863ef14f0Smrg assert(kgem_bo_is_fenced(kgem, bo)); 699963ef14f0Smrg 700003b705cfSriastradh VG_CLEAR(flink); 700103b705cfSriastradh flink.handle = bo->handle; 70029a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_GEM_FLINK, &flink)) 700303b705cfSriastradh return 0; 700403b705cfSriastradh 700503b705cfSriastradh DBG(("%s: flinked handle=%d to name=%d, marking non-reusable\n", 700603b705cfSriastradh __FUNCTION__, flink.handle, flink.name)); 700703b705cfSriastradh 700803b705cfSriastradh /* Ordinarily giving the name aware makes the buffer non-reusable. 700903b705cfSriastradh * However, we track the lifetime of all clients and their hold 701003b705cfSriastradh * on the buffer, and *presuming* they do not pass it on to a third 701103b705cfSriastradh * party, we track the lifetime accurately. 
701203b705cfSriastradh */ 701303b705cfSriastradh bo->reusable = false; 701403b705cfSriastradh kgem_bo_unclean(kgem, bo); 701503b705cfSriastradh 701603b705cfSriastradh return flink.name; 701703b705cfSriastradh} 701803b705cfSriastradh 701903b705cfSriastradhstruct kgem_bo *kgem_create_map(struct kgem *kgem, 702003b705cfSriastradh void *ptr, uint32_t size, 702103b705cfSriastradh bool read_only) 702203b705cfSriastradh{ 702303b705cfSriastradh struct kgem_bo *bo; 702403b705cfSriastradh uintptr_t first_page, last_page; 702503b705cfSriastradh uint32_t handle; 702603b705cfSriastradh 702703b705cfSriastradh assert(MAP(ptr) == ptr); 702803b705cfSriastradh 70299a906b70Schristos DBG(("%s(%p size=%d, read-only?=%d) - has_userptr?=%d\n", __FUNCTION__, 70309a906b70Schristos ptr, size, read_only, kgem->has_userptr)); 703103b705cfSriastradh if (!kgem->has_userptr) 703203b705cfSriastradh return NULL; 703303b705cfSriastradh 703403b705cfSriastradh first_page = (uintptr_t)ptr; 703503b705cfSriastradh last_page = first_page + size + PAGE_SIZE - 1; 703603b705cfSriastradh 703763ef14f0Smrg first_page &= ~(uintptr_t)(PAGE_SIZE-1); 703863ef14f0Smrg last_page &= ~(uintptr_t)(PAGE_SIZE-1); 703903b705cfSriastradh assert(last_page > first_page); 704003b705cfSriastradh 704103b705cfSriastradh handle = gem_userptr(kgem->fd, 704203b705cfSriastradh (void *)first_page, last_page-first_page, 704303b705cfSriastradh read_only); 70449a906b70Schristos if (handle == 0) { 704563ef14f0Smrg if (read_only && kgem->has_wc_mmap) { 704663ef14f0Smrg struct drm_i915_gem_set_domain set_domain; 704763ef14f0Smrg 704863ef14f0Smrg handle = gem_userptr(kgem->fd, 704963ef14f0Smrg (void *)first_page, last_page-first_page, 705063ef14f0Smrg false); 705163ef14f0Smrg 705263ef14f0Smrg VG_CLEAR(set_domain); 705363ef14f0Smrg set_domain.handle = handle; 705463ef14f0Smrg set_domain.read_domains = I915_GEM_DOMAIN_GTT; 705563ef14f0Smrg set_domain.write_domain = 0; 705663ef14f0Smrg if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_DOMAIN, 
&set_domain)) { 705763ef14f0Smrg gem_close(kgem->fd, handle); 705863ef14f0Smrg handle = 0; 705963ef14f0Smrg } 706063ef14f0Smrg } 706163ef14f0Smrg if (handle == 0) { 706263ef14f0Smrg DBG(("%s: import failed, errno=%d\n", __FUNCTION__, errno)); 706363ef14f0Smrg return NULL; 706463ef14f0Smrg } 70659a906b70Schristos } 706603b705cfSriastradh 706703b705cfSriastradh bo = __kgem_bo_alloc(handle, (last_page - first_page) / PAGE_SIZE); 706803b705cfSriastradh if (bo == NULL) { 706903b705cfSriastradh gem_close(kgem->fd, handle); 707003b705cfSriastradh return NULL; 707103b705cfSriastradh } 707203b705cfSriastradh 70739a906b70Schristos bo->unique_id = kgem_get_unique_id(kgem); 707403b705cfSriastradh bo->snoop = !kgem->has_llc; 707503b705cfSriastradh debug_alloc__bo(kgem, bo); 707603b705cfSriastradh 707703b705cfSriastradh if (first_page != (uintptr_t)ptr) { 707803b705cfSriastradh struct kgem_bo *proxy; 707903b705cfSriastradh 708003b705cfSriastradh proxy = kgem_create_proxy(kgem, bo, 708103b705cfSriastradh (uintptr_t)ptr - first_page, size); 708203b705cfSriastradh kgem_bo_destroy(kgem, bo); 708303b705cfSriastradh if (proxy == NULL) 708403b705cfSriastradh return NULL; 708503b705cfSriastradh 708603b705cfSriastradh bo = proxy; 708703b705cfSriastradh } 708803b705cfSriastradh 70899a906b70Schristos bo->map__cpu = MAKE_USER_MAP(ptr); 709003b705cfSriastradh 709103b705cfSriastradh DBG(("%s(ptr=%p, size=%d, pages=%d, read_only=%d) => handle=%d (proxy? 
%d)\n", 709203b705cfSriastradh __FUNCTION__, ptr, size, NUM_PAGES(size), read_only, handle, bo->proxy != NULL)); 709303b705cfSriastradh return bo; 709403b705cfSriastradh} 709503b705cfSriastradh 709603b705cfSriastradhvoid kgem_bo_sync__cpu(struct kgem *kgem, struct kgem_bo *bo) 709703b705cfSriastradh{ 709803b705cfSriastradh DBG(("%s: handle=%d\n", __FUNCTION__, bo->handle)); 709903b705cfSriastradh assert(!bo->scanout); 71009a906b70Schristos assert_tiling(kgem, bo); 71019a906b70Schristos 710203b705cfSriastradh kgem_bo_submit(kgem, bo); 710303b705cfSriastradh 710403b705cfSriastradh /* SHM pixmaps use proxies for subpage offsets */ 710503b705cfSriastradh assert(!bo->purged); 710603b705cfSriastradh while (bo->proxy) 710703b705cfSriastradh bo = bo->proxy; 710803b705cfSriastradh assert(!bo->purged); 710903b705cfSriastradh 711003b705cfSriastradh if (bo->domain != DOMAIN_CPU || FORCE_MMAP_SYNC & (1 << DOMAIN_CPU)) { 711103b705cfSriastradh struct drm_i915_gem_set_domain set_domain; 711203b705cfSriastradh 711303b705cfSriastradh DBG(("%s: SYNC: handle=%d, needs_flush? %d, domain? %d, busy? 
%d\n", 711403b705cfSriastradh __FUNCTION__, bo->handle, 711503b705cfSriastradh bo->needs_flush, bo->domain, 711603b705cfSriastradh __kgem_busy(kgem, bo->handle))); 711703b705cfSriastradh 711803b705cfSriastradh VG_CLEAR(set_domain); 711903b705cfSriastradh set_domain.handle = bo->handle; 712003b705cfSriastradh set_domain.read_domains = I915_GEM_DOMAIN_CPU; 712103b705cfSriastradh set_domain.write_domain = I915_GEM_DOMAIN_CPU; 712203b705cfSriastradh 71239a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_DOMAIN, &set_domain)) { 71249a906b70Schristos DBG(("%s: sync: GPU hang detected\n", __FUNCTION__)); 71259a906b70Schristos kgem_throttle(kgem); 712603b705cfSriastradh } 712763ef14f0Smrg bo->needs_flush = false; 71289a906b70Schristos kgem_bo_retire(kgem, bo); 71299a906b70Schristos bo->domain = DOMAIN_CPU; 713063ef14f0Smrg bo->gtt_dirty = true; 713103b705cfSriastradh } 713203b705cfSriastradh} 713303b705cfSriastradh 713403b705cfSriastradhvoid kgem_bo_sync__cpu_full(struct kgem *kgem, struct kgem_bo *bo, bool write) 713503b705cfSriastradh{ 713603b705cfSriastradh DBG(("%s: handle=%d\n", __FUNCTION__, bo->handle)); 713703b705cfSriastradh assert(!bo->scanout || !write); 71389a906b70Schristos assert_tiling(kgem, bo); 713903b705cfSriastradh 714003b705cfSriastradh if (write || bo->needs_flush) 714103b705cfSriastradh kgem_bo_submit(kgem, bo); 714203b705cfSriastradh 714303b705cfSriastradh /* SHM pixmaps use proxies for subpage offsets */ 714403b705cfSriastradh assert(!bo->purged); 714503b705cfSriastradh assert(bo->refcnt); 714603b705cfSriastradh while (bo->proxy) 714703b705cfSriastradh bo = bo->proxy; 714803b705cfSriastradh assert(bo->refcnt); 714903b705cfSriastradh assert(!bo->purged); 715003b705cfSriastradh 715163ef14f0Smrg if (bo->rq == NULL && (kgem->has_llc || bo->snoop) && !write) 715263ef14f0Smrg return; 715363ef14f0Smrg 715403b705cfSriastradh if (bo->domain != DOMAIN_CPU || FORCE_MMAP_SYNC & (1 << DOMAIN_CPU)) { 715503b705cfSriastradh struct 
drm_i915_gem_set_domain set_domain; 715603b705cfSriastradh 715703b705cfSriastradh DBG(("%s: SYNC: handle=%d, needs_flush? %d, domain? %d, busy? %d\n", 715803b705cfSriastradh __FUNCTION__, bo->handle, 715903b705cfSriastradh bo->needs_flush, bo->domain, 716003b705cfSriastradh __kgem_busy(kgem, bo->handle))); 716103b705cfSriastradh 716203b705cfSriastradh VG_CLEAR(set_domain); 716303b705cfSriastradh set_domain.handle = bo->handle; 716403b705cfSriastradh set_domain.read_domains = I915_GEM_DOMAIN_CPU; 716503b705cfSriastradh set_domain.write_domain = write ? I915_GEM_DOMAIN_CPU : 0; 716603b705cfSriastradh 71679a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_DOMAIN, &set_domain)) { 71689a906b70Schristos DBG(("%s: sync: GPU hang detected\n", __FUNCTION__)); 71699a906b70Schristos kgem_throttle(kgem); 71709a906b70Schristos } 717163ef14f0Smrg bo->needs_flush = false; 71729a906b70Schristos if (write) { 71739a906b70Schristos kgem_bo_retire(kgem, bo); 71749a906b70Schristos bo->domain = DOMAIN_CPU; 717563ef14f0Smrg bo->gtt_dirty = true; 71769a906b70Schristos } else { 717703b705cfSriastradh if (bo->exec == NULL) 71789a906b70Schristos kgem_bo_maybe_retire(kgem, bo); 71799a906b70Schristos bo->domain = DOMAIN_NONE; 718003b705cfSriastradh } 718103b705cfSriastradh } 718203b705cfSriastradh} 718303b705cfSriastradh 718403b705cfSriastradhvoid kgem_bo_sync__gtt(struct kgem *kgem, struct kgem_bo *bo) 718503b705cfSriastradh{ 718603b705cfSriastradh DBG(("%s: handle=%d\n", __FUNCTION__, bo->handle)); 718703b705cfSriastradh assert(bo->refcnt); 718803b705cfSriastradh assert(bo->proxy == NULL); 71899a906b70Schristos assert_tiling(kgem, bo); 719063ef14f0Smrg assert(!bo->snoop); 719103b705cfSriastradh 719203b705cfSriastradh kgem_bo_submit(kgem, bo); 719303b705cfSriastradh 719463ef14f0Smrg if (bo->domain != DOMAIN_GTT || 719563ef14f0Smrg !kgem->has_coherent_mmap_gtt || 719663ef14f0Smrg FORCE_MMAP_SYNC & (1 << DOMAIN_GTT)) { 719703b705cfSriastradh struct drm_i915_gem_set_domain 
set_domain; 719803b705cfSriastradh 719903b705cfSriastradh DBG(("%s: SYNC: handle=%d, needs_flush? %d, domain? %d, busy? %d\n", 720003b705cfSriastradh __FUNCTION__, bo->handle, 720103b705cfSriastradh bo->needs_flush, bo->domain, 720203b705cfSriastradh __kgem_busy(kgem, bo->handle))); 720303b705cfSriastradh 720403b705cfSriastradh VG_CLEAR(set_domain); 720503b705cfSriastradh set_domain.handle = bo->handle; 720603b705cfSriastradh set_domain.read_domains = I915_GEM_DOMAIN_GTT; 720703b705cfSriastradh set_domain.write_domain = I915_GEM_DOMAIN_GTT; 720803b705cfSriastradh 72099a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_DOMAIN, &set_domain)) { 72109a906b70Schristos DBG(("%s: sync: GPU hang detected\n", __FUNCTION__)); 72119a906b70Schristos kgem_throttle(kgem); 721203b705cfSriastradh } 721363ef14f0Smrg bo->needs_flush = false; 72149a906b70Schristos kgem_bo_retire(kgem, bo); 72159a906b70Schristos bo->domain = DOMAIN_GTT; 72169a906b70Schristos bo->gtt_dirty = true; 721703b705cfSriastradh } 721803b705cfSriastradh} 721903b705cfSriastradh 722003b705cfSriastradhvoid kgem_clear_dirty(struct kgem *kgem) 722103b705cfSriastradh{ 722203b705cfSriastradh struct list * const buffers = &kgem->next_request->buffers; 722303b705cfSriastradh struct kgem_bo *bo; 722403b705cfSriastradh 722503b705cfSriastradh list_for_each_entry(bo, buffers, request) { 722603b705cfSriastradh if (!bo->gpu_dirty) 722703b705cfSriastradh break; 722803b705cfSriastradh 722903b705cfSriastradh bo->gpu_dirty = false; 723003b705cfSriastradh } 723103b705cfSriastradh} 723203b705cfSriastradh 723303b705cfSriastradhstruct kgem_bo *kgem_create_proxy(struct kgem *kgem, 723403b705cfSriastradh struct kgem_bo *target, 723503b705cfSriastradh int offset, int length) 723603b705cfSriastradh{ 723703b705cfSriastradh struct kgem_bo *bo; 723803b705cfSriastradh 723903b705cfSriastradh DBG(("%s: target handle=%d [proxy? %d], offset=%d, length=%d, io=%d\n", 724003b705cfSriastradh __FUNCTION__, target->handle, target->proxy ? 
target->proxy->delta : -1, 724103b705cfSriastradh offset, length, target->io)); 724203b705cfSriastradh 724303b705cfSriastradh bo = __kgem_bo_alloc(target->handle, length); 724403b705cfSriastradh if (bo == NULL) 724503b705cfSriastradh return NULL; 724603b705cfSriastradh 724703b705cfSriastradh bo->unique_id = kgem_get_unique_id(kgem); 724803b705cfSriastradh bo->reusable = false; 724903b705cfSriastradh bo->size.bytes = length; 725003b705cfSriastradh 725103b705cfSriastradh bo->io = target->io && target->proxy == NULL; 725203b705cfSriastradh bo->gpu_dirty = target->gpu_dirty; 725303b705cfSriastradh bo->tiling = target->tiling; 725403b705cfSriastradh bo->pitch = target->pitch; 725503b705cfSriastradh bo->flush = target->flush; 725603b705cfSriastradh bo->snoop = target->snoop; 725703b705cfSriastradh 725803b705cfSriastradh assert(!bo->scanout); 725903b705cfSriastradh bo->proxy = kgem_bo_reference(target); 726003b705cfSriastradh bo->delta = offset; 726103b705cfSriastradh 72629a906b70Schristos /* Proxies are only tracked for busyness on the current rq */ 72639a906b70Schristos if (target->exec && !bo->io) { 72649a906b70Schristos assert(RQ(target->rq) == kgem->next_request); 726503b705cfSriastradh list_move_tail(&bo->request, &kgem->next_request->buffers); 726603b705cfSriastradh bo->exec = &_kgem_dummy_exec; 72679a906b70Schristos bo->rq = target->rq; 726803b705cfSriastradh } 726903b705cfSriastradh 727003b705cfSriastradh return bo; 727103b705cfSriastradh} 727203b705cfSriastradh 727303b705cfSriastradhstatic struct kgem_buffer * 727403b705cfSriastradhbuffer_alloc(void) 727503b705cfSriastradh{ 727603b705cfSriastradh struct kgem_buffer *bo; 727703b705cfSriastradh 727803b705cfSriastradh bo = malloc(sizeof(*bo)); 727903b705cfSriastradh if (bo == NULL) 728003b705cfSriastradh return NULL; 728103b705cfSriastradh 728203b705cfSriastradh bo->mem = NULL; 728303b705cfSriastradh bo->need_io = false; 72849a906b70Schristos bo->mmapped = MMAPPED_CPU; 728503b705cfSriastradh 728603b705cfSriastradh 
return bo; 728703b705cfSriastradh} 728803b705cfSriastradh 728903b705cfSriastradhstatic struct kgem_buffer * 729003b705cfSriastradhbuffer_alloc_with_data(int num_pages) 729103b705cfSriastradh{ 729203b705cfSriastradh struct kgem_buffer *bo; 729303b705cfSriastradh 729403b705cfSriastradh bo = malloc(sizeof(*bo) + 2*UPLOAD_ALIGNMENT + num_pages * PAGE_SIZE); 729503b705cfSriastradh if (bo == NULL) 729603b705cfSriastradh return NULL; 729703b705cfSriastradh 729803b705cfSriastradh bo->mem = (void *)ALIGN((uintptr_t)bo + sizeof(*bo), UPLOAD_ALIGNMENT); 729903b705cfSriastradh bo->mmapped = false; 730003b705cfSriastradh return bo; 730103b705cfSriastradh} 730203b705cfSriastradh 730303b705cfSriastradhstatic inline bool 730403b705cfSriastradhuse_snoopable_buffer(struct kgem *kgem, uint32_t flags) 730503b705cfSriastradh{ 730603b705cfSriastradh if ((flags & KGEM_BUFFER_WRITE) == 0) 730703b705cfSriastradh return kgem->gen >= 030; 730803b705cfSriastradh 730903b705cfSriastradh return true; 731003b705cfSriastradh} 731103b705cfSriastradh 731203b705cfSriastradhstatic void 731303b705cfSriastradhinit_buffer_from_bo(struct kgem_buffer *bo, struct kgem_bo *old) 731403b705cfSriastradh{ 731503b705cfSriastradh DBG(("%s: reusing handle=%d for buffer\n", 731603b705cfSriastradh __FUNCTION__, old->handle)); 731703b705cfSriastradh 731803b705cfSriastradh assert(old->proxy == NULL); 7319813957e3Ssnj assert(list_is_empty(&old->list)); 732003b705cfSriastradh 732103b705cfSriastradh memcpy(&bo->base, old, sizeof(*old)); 732203b705cfSriastradh if (old->rq) 732303b705cfSriastradh list_replace(&old->request, &bo->base.request); 732403b705cfSriastradh else 732503b705cfSriastradh list_init(&bo->base.request); 732603b705cfSriastradh list_replace(&old->vma, &bo->base.vma); 732703b705cfSriastradh list_init(&bo->base.list); 732803b705cfSriastradh free(old); 732903b705cfSriastradh 733003b705cfSriastradh assert(bo->base.tiling == I915_TILING_NONE); 733103b705cfSriastradh 733203b705cfSriastradh bo->base.refcnt = 1; 
733303b705cfSriastradh} 733403b705cfSriastradh 733503b705cfSriastradhstatic struct kgem_buffer * 733603b705cfSriastradhsearch_snoopable_buffer(struct kgem *kgem, unsigned alloc) 733703b705cfSriastradh{ 733803b705cfSriastradh struct kgem_buffer *bo; 733903b705cfSriastradh struct kgem_bo *old; 734003b705cfSriastradh 734103b705cfSriastradh old = search_snoop_cache(kgem, alloc, 0); 734203b705cfSriastradh if (old) { 734303b705cfSriastradh if (!old->io) { 734403b705cfSriastradh bo = buffer_alloc(); 734503b705cfSriastradh if (bo == NULL) 734603b705cfSriastradh return NULL; 734703b705cfSriastradh 734803b705cfSriastradh init_buffer_from_bo(bo, old); 734903b705cfSriastradh } else { 735003b705cfSriastradh bo = (struct kgem_buffer *)old; 735103b705cfSriastradh bo->base.refcnt = 1; 735203b705cfSriastradh } 735303b705cfSriastradh 735403b705cfSriastradh DBG(("%s: created CPU handle=%d for buffer, size %d\n", 735503b705cfSriastradh __FUNCTION__, bo->base.handle, num_pages(&bo->base))); 735603b705cfSriastradh 735703b705cfSriastradh assert(bo->base.snoop); 735803b705cfSriastradh assert(bo->base.tiling == I915_TILING_NONE); 735903b705cfSriastradh assert(num_pages(&bo->base) >= alloc); 73609a906b70Schristos assert(bo->mmapped == MMAPPED_CPU); 736103b705cfSriastradh assert(bo->need_io == false); 736203b705cfSriastradh 736303b705cfSriastradh bo->mem = kgem_bo_map__cpu(kgem, &bo->base); 736403b705cfSriastradh if (bo->mem == NULL) { 736503b705cfSriastradh bo->base.refcnt = 0; 736603b705cfSriastradh kgem_bo_free(kgem, &bo->base); 736703b705cfSriastradh bo = NULL; 736803b705cfSriastradh } 736903b705cfSriastradh 737003b705cfSriastradh return bo; 737103b705cfSriastradh } 737203b705cfSriastradh 737303b705cfSriastradh return NULL; 737403b705cfSriastradh} 737503b705cfSriastradh 737603b705cfSriastradhstatic struct kgem_buffer * 737703b705cfSriastradhcreate_snoopable_buffer(struct kgem *kgem, unsigned alloc) 737803b705cfSriastradh{ 737903b705cfSriastradh struct kgem_buffer *bo; 
738003b705cfSriastradh uint32_t handle; 738103b705cfSriastradh 738203b705cfSriastradh if (kgem->has_llc) { 738303b705cfSriastradh struct kgem_bo *old; 738403b705cfSriastradh 738503b705cfSriastradh bo = buffer_alloc(); 738603b705cfSriastradh if (bo == NULL) 738703b705cfSriastradh return NULL; 738803b705cfSriastradh 738903b705cfSriastradh old = search_linear_cache(kgem, alloc, 739003b705cfSriastradh CREATE_INACTIVE | CREATE_CPU_MAP | CREATE_EXACT); 739103b705cfSriastradh if (old) { 739203b705cfSriastradh init_buffer_from_bo(bo, old); 739303b705cfSriastradh } else { 739403b705cfSriastradh handle = gem_create(kgem->fd, alloc); 739503b705cfSriastradh if (handle == 0) { 739603b705cfSriastradh free(bo); 739703b705cfSriastradh return NULL; 739803b705cfSriastradh } 739903b705cfSriastradh 740003b705cfSriastradh __kgem_bo_init(&bo->base, handle, alloc); 74019a906b70Schristos debug_alloc__bo(kgem, &bo->base); 740203b705cfSriastradh DBG(("%s: created CPU (LLC) handle=%d for buffer, size %d\n", 740303b705cfSriastradh __FUNCTION__, bo->base.handle, alloc)); 740403b705cfSriastradh } 740503b705cfSriastradh 740603b705cfSriastradh assert(bo->base.refcnt == 1); 74079a906b70Schristos assert(bo->mmapped == MMAPPED_CPU); 740803b705cfSriastradh assert(bo->need_io == false); 740903b705cfSriastradh 741003b705cfSriastradh bo->mem = kgem_bo_map__cpu(kgem, &bo->base); 741103b705cfSriastradh if (bo->mem != NULL) 741203b705cfSriastradh return bo; 741303b705cfSriastradh 741403b705cfSriastradh bo->base.refcnt = 0; /* for valgrind */ 741503b705cfSriastradh kgem_bo_free(kgem, &bo->base); 741603b705cfSriastradh } 741703b705cfSriastradh 741803b705cfSriastradh if (kgem->has_caching) { 741903b705cfSriastradh struct kgem_bo *old; 742003b705cfSriastradh 742103b705cfSriastradh bo = buffer_alloc(); 742203b705cfSriastradh if (bo == NULL) 742303b705cfSriastradh return NULL; 742403b705cfSriastradh 742503b705cfSriastradh old = search_linear_cache(kgem, alloc, 742603b705cfSriastradh CREATE_INACTIVE | 
CREATE_CPU_MAP | CREATE_EXACT); 742703b705cfSriastradh if (old) { 742803b705cfSriastradh init_buffer_from_bo(bo, old); 742903b705cfSriastradh } else { 743003b705cfSriastradh handle = gem_create(kgem->fd, alloc); 743103b705cfSriastradh if (handle == 0) { 743203b705cfSriastradh free(bo); 743303b705cfSriastradh return NULL; 743403b705cfSriastradh } 743503b705cfSriastradh 743603b705cfSriastradh __kgem_bo_init(&bo->base, handle, alloc); 74379a906b70Schristos debug_alloc__bo(kgem, &bo->base); 743803b705cfSriastradh DBG(("%s: created CPU handle=%d for buffer, size %d\n", 743903b705cfSriastradh __FUNCTION__, bo->base.handle, alloc)); 744003b705cfSriastradh } 744103b705cfSriastradh 744203b705cfSriastradh assert(bo->base.refcnt == 1); 74439a906b70Schristos assert(bo->mmapped == MMAPPED_CPU); 744403b705cfSriastradh assert(bo->need_io == false); 7445813957e3Ssnj assert(!__kgem_busy(kgem, bo->base.handle)); 744603b705cfSriastradh 744703b705cfSriastradh if (!gem_set_caching(kgem->fd, bo->base.handle, SNOOPED)) 744803b705cfSriastradh goto free_caching; 744903b705cfSriastradh 745003b705cfSriastradh bo->base.snoop = true; 745103b705cfSriastradh 745203b705cfSriastradh bo->mem = kgem_bo_map__cpu(kgem, &bo->base); 745303b705cfSriastradh if (bo->mem == NULL) 745403b705cfSriastradh goto free_caching; 745503b705cfSriastradh 745603b705cfSriastradh return bo; 745703b705cfSriastradh 745803b705cfSriastradhfree_caching: 745903b705cfSriastradh bo->base.refcnt = 0; /* for valgrind */ 746003b705cfSriastradh kgem_bo_free(kgem, &bo->base); 746103b705cfSriastradh } 746203b705cfSriastradh 746303b705cfSriastradh if (kgem->has_userptr) { 746403b705cfSriastradh bo = buffer_alloc(); 746503b705cfSriastradh if (bo == NULL) 746603b705cfSriastradh return NULL; 746703b705cfSriastradh 746803b705cfSriastradh //if (posix_memalign(&ptr, 64, ALIGN(size, 64))) 746903b705cfSriastradh if (posix_memalign(&bo->mem, PAGE_SIZE, alloc * PAGE_SIZE)) { 747003b705cfSriastradh free(bo); 747103b705cfSriastradh return NULL; 
747203b705cfSriastradh } 747303b705cfSriastradh 747403b705cfSriastradh handle = gem_userptr(kgem->fd, bo->mem, alloc * PAGE_SIZE, false); 747503b705cfSriastradh if (handle == 0) { 747603b705cfSriastradh free(bo->mem); 747703b705cfSriastradh free(bo); 747803b705cfSriastradh return NULL; 747903b705cfSriastradh } 748003b705cfSriastradh 748103b705cfSriastradh __kgem_bo_init(&bo->base, handle, alloc); 74829a906b70Schristos debug_alloc__bo(kgem, &bo->base); 748303b705cfSriastradh DBG(("%s: created snoop handle=%d for buffer\n", 748403b705cfSriastradh __FUNCTION__, bo->base.handle)); 748503b705cfSriastradh 74869a906b70Schristos assert(bo->mmapped == MMAPPED_CPU); 748703b705cfSriastradh assert(bo->need_io == false); 748803b705cfSriastradh 748903b705cfSriastradh bo->base.refcnt = 1; 749003b705cfSriastradh bo->base.snoop = true; 74919a906b70Schristos bo->base.map__cpu = MAKE_USER_MAP(bo->mem); 749203b705cfSriastradh 749303b705cfSriastradh return bo; 749403b705cfSriastradh } 749503b705cfSriastradh 749603b705cfSriastradh return NULL; 749703b705cfSriastradh} 749803b705cfSriastradh 749903b705cfSriastradhstruct kgem_bo *kgem_create_buffer(struct kgem *kgem, 750003b705cfSriastradh uint32_t size, uint32_t flags, 750103b705cfSriastradh void **ret) 750203b705cfSriastradh{ 750303b705cfSriastradh struct kgem_buffer *bo; 750403b705cfSriastradh unsigned offset, alloc; 750503b705cfSriastradh struct kgem_bo *old; 750603b705cfSriastradh 750703b705cfSriastradh DBG(("%s: size=%d, flags=%x [write?=%d, inplace?=%d, last?=%d]\n", 750803b705cfSriastradh __FUNCTION__, size, flags, 750903b705cfSriastradh !!(flags & KGEM_BUFFER_WRITE), 751003b705cfSriastradh !!(flags & KGEM_BUFFER_INPLACE), 751103b705cfSriastradh !!(flags & KGEM_BUFFER_LAST))); 751203b705cfSriastradh assert(size); 751303b705cfSriastradh /* we should never be asked to create anything TOO large */ 751403b705cfSriastradh assert(size <= kgem->max_object_size); 751503b705cfSriastradh 751603b705cfSriastradh#if !DBG_NO_UPLOAD_CACHE 
751703b705cfSriastradh list_for_each_entry(bo, &kgem->batch_buffers, base.list) { 751803b705cfSriastradh assert(bo->base.io); 751903b705cfSriastradh assert(bo->base.refcnt >= 1); 752003b705cfSriastradh 752103b705cfSriastradh /* We can reuse any write buffer which we can fit */ 752203b705cfSriastradh if (flags == KGEM_BUFFER_LAST && 752303b705cfSriastradh bo->write == KGEM_BUFFER_WRITE && 75249a906b70Schristos bo->base.refcnt == 1 && 75259a906b70Schristos bo->mmapped == MMAPPED_NONE && 752603b705cfSriastradh size <= bytes(&bo->base)) { 752703b705cfSriastradh DBG(("%s: reusing write buffer for read of %d bytes? used=%d, total=%d\n", 752803b705cfSriastradh __FUNCTION__, size, bo->used, bytes(&bo->base))); 75299a906b70Schristos gem_write__cachealigned(kgem->fd, bo->base.handle, 75309a906b70Schristos 0, bo->used, bo->mem); 75319a906b70Schristos assert(list_is_empty(&bo->base.vma)); 753203b705cfSriastradh bo->need_io = 0; 753303b705cfSriastradh bo->write = 0; 753403b705cfSriastradh offset = 0; 753503b705cfSriastradh bo->used = size; 753603b705cfSriastradh goto done; 753703b705cfSriastradh } 753803b705cfSriastradh 753903b705cfSriastradh if (flags & KGEM_BUFFER_WRITE) { 754003b705cfSriastradh if ((bo->write & KGEM_BUFFER_WRITE) == 0 || 754103b705cfSriastradh (((bo->write & ~flags) & KGEM_BUFFER_INPLACE) && 754203b705cfSriastradh !bo->base.snoop)) { 754303b705cfSriastradh DBG(("%s: skip write %x buffer, need %x\n", 754403b705cfSriastradh __FUNCTION__, bo->write, flags)); 754503b705cfSriastradh continue; 754603b705cfSriastradh } 754703b705cfSriastradh assert(bo->mmapped || bo->need_io); 754803b705cfSriastradh } else { 754903b705cfSriastradh if (bo->write & KGEM_BUFFER_WRITE) { 755003b705cfSriastradh DBG(("%s: skip write %x buffer, need %x\n", 755103b705cfSriastradh __FUNCTION__, bo->write, flags)); 755203b705cfSriastradh continue; 755303b705cfSriastradh } 755403b705cfSriastradh } 755503b705cfSriastradh 755603b705cfSriastradh if (bo->used + size <= bytes(&bo->base)) { 
755703b705cfSriastradh DBG(("%s: reusing buffer? used=%d + size=%d, total=%d\n", 755803b705cfSriastradh __FUNCTION__, bo->used, size, bytes(&bo->base))); 755903b705cfSriastradh offset = bo->used; 756003b705cfSriastradh bo->used += size; 756103b705cfSriastradh goto done; 756203b705cfSriastradh } 756303b705cfSriastradh } 756403b705cfSriastradh 756503b705cfSriastradh if (flags & KGEM_BUFFER_WRITE) { 756603b705cfSriastradh list_for_each_entry(bo, &kgem->active_buffers, base.list) { 756703b705cfSriastradh assert(bo->base.io); 756803b705cfSriastradh assert(bo->base.refcnt >= 1); 75699a906b70Schristos assert(bo->base.exec == NULL); 757003b705cfSriastradh assert(bo->mmapped); 75719a906b70Schristos assert(bo->mmapped == MMAPPED_GTT || kgem->has_llc || bo->base.snoop); 757203b705cfSriastradh 75739a906b70Schristos if ((bo->write & ~flags) & KGEM_BUFFER_INPLACE && !bo->base.snoop) { 757403b705cfSriastradh DBG(("%s: skip write %x buffer, need %x\n", 757503b705cfSriastradh __FUNCTION__, bo->write, flags)); 757603b705cfSriastradh continue; 757703b705cfSriastradh } 757803b705cfSriastradh 757903b705cfSriastradh if (bo->used + size <= bytes(&bo->base)) { 758003b705cfSriastradh DBG(("%s: reusing buffer? used=%d + size=%d, total=%d\n", 758103b705cfSriastradh __FUNCTION__, bo->used, size, bytes(&bo->base))); 758203b705cfSriastradh offset = bo->used; 758303b705cfSriastradh bo->used += size; 758403b705cfSriastradh list_move(&bo->base.list, &kgem->batch_buffers); 758503b705cfSriastradh goto done; 758603b705cfSriastradh } 75879a906b70Schristos 75889a906b70Schristos if (bo->base.refcnt == 1 && 75899a906b70Schristos size <= bytes(&bo->base) && 75909a906b70Schristos (bo->base.rq == NULL || 75919a906b70Schristos !__kgem_busy(kgem, bo->base.handle))) { 75929a906b70Schristos DBG(("%s: reusing whole buffer? 
size=%d, total=%d\n", 75939a906b70Schristos __FUNCTION__, size, bytes(&bo->base))); 75949a906b70Schristos __kgem_bo_clear_busy(&bo->base); 75959a906b70Schristos assert(list_is_empty(&bo->base.vma)); 75969a906b70Schristos 75979a906b70Schristos switch (bo->mmapped) { 75989a906b70Schristos case MMAPPED_CPU: 75999a906b70Schristos kgem_bo_sync__cpu(kgem, &bo->base); 76009a906b70Schristos break; 76019a906b70Schristos case MMAPPED_GTT: 76029a906b70Schristos kgem_bo_sync__gtt(kgem, &bo->base); 76039a906b70Schristos break; 76049a906b70Schristos } 76059a906b70Schristos 76069a906b70Schristos offset = 0; 76079a906b70Schristos bo->used = size; 76089a906b70Schristos list_move(&bo->base.list, &kgem->batch_buffers); 76099a906b70Schristos goto done; 76109a906b70Schristos } 761103b705cfSriastradh } 761203b705cfSriastradh } 761303b705cfSriastradh#endif 761403b705cfSriastradh 761503b705cfSriastradh#if !DBG_NO_MAP_UPLOAD 761603b705cfSriastradh /* Be a little more generous and hope to hold fewer mmappings */ 761703b705cfSriastradh alloc = ALIGN(2*size, kgem->buffer_size); 761803b705cfSriastradh if (alloc > MAX_CACHE_SIZE) 761903b705cfSriastradh alloc = ALIGN(size, kgem->buffer_size); 762003b705cfSriastradh if (alloc > MAX_CACHE_SIZE) 762103b705cfSriastradh alloc = PAGE_ALIGN(size); 762203b705cfSriastradh assert(alloc); 762303b705cfSriastradh 76249a906b70Schristos alloc /= PAGE_SIZE; 7625813957e3Ssnj if (alloc > kgem->aperture_mappable / 4 && !kgem->has_wc_mmap) 762603b705cfSriastradh flags &= ~KGEM_BUFFER_INPLACE; 762703b705cfSriastradh 762803b705cfSriastradh if (kgem->has_llc && 762903b705cfSriastradh (flags & KGEM_BUFFER_WRITE_INPLACE) != KGEM_BUFFER_WRITE_INPLACE) { 763003b705cfSriastradh bo = buffer_alloc(); 763103b705cfSriastradh if (bo == NULL) 763203b705cfSriastradh goto skip_llc; 763303b705cfSriastradh 763403b705cfSriastradh old = NULL; 763503b705cfSriastradh if ((flags & KGEM_BUFFER_WRITE) == 0) 763603b705cfSriastradh old = search_linear_cache(kgem, alloc, CREATE_CPU_MAP); 
763703b705cfSriastradh if (old == NULL) 763803b705cfSriastradh old = search_linear_cache(kgem, alloc, CREATE_INACTIVE | CREATE_CPU_MAP); 763903b705cfSriastradh if (old == NULL) 764003b705cfSriastradh old = search_linear_cache(kgem, NUM_PAGES(size), CREATE_INACTIVE | CREATE_CPU_MAP); 764103b705cfSriastradh if (old) { 764203b705cfSriastradh DBG(("%s: found LLC handle=%d for buffer\n", 764303b705cfSriastradh __FUNCTION__, old->handle)); 764403b705cfSriastradh 764503b705cfSriastradh init_buffer_from_bo(bo, old); 764603b705cfSriastradh } else { 764703b705cfSriastradh uint32_t handle = gem_create(kgem->fd, alloc); 764803b705cfSriastradh if (handle == 0) { 764903b705cfSriastradh free(bo); 765003b705cfSriastradh goto skip_llc; 765103b705cfSriastradh } 765203b705cfSriastradh __kgem_bo_init(&bo->base, handle, alloc); 76539a906b70Schristos debug_alloc__bo(kgem, &bo->base); 765403b705cfSriastradh DBG(("%s: created LLC handle=%d for buffer\n", 765503b705cfSriastradh __FUNCTION__, bo->base.handle)); 765603b705cfSriastradh } 765703b705cfSriastradh 765803b705cfSriastradh assert(bo->mmapped); 765903b705cfSriastradh assert(!bo->need_io); 766003b705cfSriastradh 766103b705cfSriastradh bo->mem = kgem_bo_map__cpu(kgem, &bo->base); 766203b705cfSriastradh if (bo->mem) { 766303b705cfSriastradh if (flags & KGEM_BUFFER_WRITE) 766403b705cfSriastradh kgem_bo_sync__cpu(kgem, &bo->base); 766503b705cfSriastradh flags &= ~KGEM_BUFFER_INPLACE; 766603b705cfSriastradh goto init; 766703b705cfSriastradh } else { 766803b705cfSriastradh bo->base.refcnt = 0; /* for valgrind */ 766903b705cfSriastradh kgem_bo_free(kgem, &bo->base); 767003b705cfSriastradh } 767103b705cfSriastradh } 767203b705cfSriastradhskip_llc: 767303b705cfSriastradh 767403b705cfSriastradh if ((flags & KGEM_BUFFER_WRITE_INPLACE) == KGEM_BUFFER_WRITE_INPLACE) { 767503b705cfSriastradh /* The issue with using a GTT upload buffer is that we may 767603b705cfSriastradh * cause eviction-stalls in order to free up some GTT space. 
767703b705cfSriastradh * An is-mappable? ioctl could help us detect when we are 767803b705cfSriastradh * about to block, or some per-page magic in the kernel. 767903b705cfSriastradh * 768003b705cfSriastradh * XXX This is especially noticeable on memory constrained 768103b705cfSriastradh * devices like gen2 or with relatively slow gpu like i3. 768203b705cfSriastradh */ 768303b705cfSriastradh DBG(("%s: searching for an inactive GTT map for upload\n", 768403b705cfSriastradh __FUNCTION__)); 768503b705cfSriastradh old = search_linear_cache(kgem, alloc, 768603b705cfSriastradh CREATE_EXACT | CREATE_INACTIVE | CREATE_GTT_MAP); 768703b705cfSriastradh#if HAVE_I915_GEM_BUFFER_INFO 768803b705cfSriastradh if (old) { 768903b705cfSriastradh struct drm_i915_gem_buffer_info info; 769003b705cfSriastradh 769103b705cfSriastradh /* An example of such a non-blocking ioctl might work */ 769203b705cfSriastradh 769303b705cfSriastradh VG_CLEAR(info); 769403b705cfSriastradh info.handle = handle; 76959a906b70Schristos if (do_ioctl(kgem->fd, 769603b705cfSriastradh DRM_IOCTL_I915_GEM_BUFFER_INFO, 769703b705cfSriastradh &fino) == 0) { 769803b705cfSriastradh old->presumed_offset = info.addr; 769903b705cfSriastradh if ((info.flags & I915_GEM_MAPPABLE) == 0) { 770003b705cfSriastradh kgem_bo_move_to_inactive(kgem, old); 770103b705cfSriastradh old = NULL; 770203b705cfSriastradh } 770303b705cfSriastradh } 770403b705cfSriastradh } 770503b705cfSriastradh#endif 770603b705cfSriastradh if (old == NULL) 770703b705cfSriastradh old = search_linear_cache(kgem, NUM_PAGES(size), 770803b705cfSriastradh CREATE_EXACT | CREATE_INACTIVE | CREATE_GTT_MAP); 770903b705cfSriastradh if (old == NULL) { 771003b705cfSriastradh old = search_linear_cache(kgem, alloc, CREATE_INACTIVE); 77119a906b70Schristos if (old && !kgem_bo_can_map(kgem, old)) { 771203b705cfSriastradh _kgem_bo_destroy(kgem, old); 771303b705cfSriastradh old = NULL; 771403b705cfSriastradh } 771503b705cfSriastradh } 771603b705cfSriastradh if (old) { 
771703b705cfSriastradh DBG(("%s: reusing handle=%d for buffer\n", 771803b705cfSriastradh __FUNCTION__, old->handle)); 77199a906b70Schristos assert(kgem_bo_can_map(kgem, old)); 772003b705cfSriastradh assert(!old->snoop); 772103b705cfSriastradh assert(old->rq == NULL); 772203b705cfSriastradh 772303b705cfSriastradh bo = buffer_alloc(); 772403b705cfSriastradh if (bo == NULL) 772503b705cfSriastradh return NULL; 772603b705cfSriastradh 772703b705cfSriastradh init_buffer_from_bo(bo, old); 772803b705cfSriastradh assert(num_pages(&bo->base) >= NUM_PAGES(size)); 772903b705cfSriastradh 773003b705cfSriastradh assert(bo->mmapped); 773103b705cfSriastradh assert(bo->base.refcnt == 1); 773203b705cfSriastradh 773303b705cfSriastradh bo->mem = kgem_bo_map(kgem, &bo->base); 773403b705cfSriastradh if (bo->mem) { 77359a906b70Schristos if (bo->mem == MAP(bo->base.map__cpu)) 773603b705cfSriastradh flags &= ~KGEM_BUFFER_INPLACE; 77379a906b70Schristos else 77389a906b70Schristos bo->mmapped = MMAPPED_GTT; 773903b705cfSriastradh goto init; 774003b705cfSriastradh } else { 774103b705cfSriastradh bo->base.refcnt = 0; 774203b705cfSriastradh kgem_bo_free(kgem, &bo->base); 774303b705cfSriastradh } 774403b705cfSriastradh } 774503b705cfSriastradh } 774603b705cfSriastradh#else 774703b705cfSriastradh flags &= ~KGEM_BUFFER_INPLACE; 774803b705cfSriastradh#endif 774903b705cfSriastradh /* Be more parsimonious with pwrite/pread/cacheable buffers */ 775003b705cfSriastradh if ((flags & KGEM_BUFFER_INPLACE) == 0) 775103b705cfSriastradh alloc = NUM_PAGES(size); 775203b705cfSriastradh 775303b705cfSriastradh if (use_snoopable_buffer(kgem, flags)) { 775403b705cfSriastradh bo = search_snoopable_buffer(kgem, alloc); 775503b705cfSriastradh if (bo) { 775603b705cfSriastradh if (flags & KGEM_BUFFER_WRITE) 775703b705cfSriastradh kgem_bo_sync__cpu(kgem, &bo->base); 775803b705cfSriastradh flags &= ~KGEM_BUFFER_INPLACE; 775903b705cfSriastradh goto init; 776003b705cfSriastradh } 776103b705cfSriastradh 776203b705cfSriastradh 
if ((flags & KGEM_BUFFER_INPLACE) == 0) { 776303b705cfSriastradh bo = create_snoopable_buffer(kgem, alloc); 776403b705cfSriastradh if (bo) 776503b705cfSriastradh goto init; 776603b705cfSriastradh } 776703b705cfSriastradh } 776803b705cfSriastradh 776903b705cfSriastradh flags &= ~KGEM_BUFFER_INPLACE; 777003b705cfSriastradh 777103b705cfSriastradh old = NULL; 777203b705cfSriastradh if ((flags & KGEM_BUFFER_WRITE) == 0) 777303b705cfSriastradh old = search_linear_cache(kgem, alloc, 0); 777403b705cfSriastradh if (old == NULL) 777503b705cfSriastradh old = search_linear_cache(kgem, alloc, CREATE_INACTIVE); 777603b705cfSriastradh if (old) { 777703b705cfSriastradh DBG(("%s: reusing ordinary handle %d for io\n", 777803b705cfSriastradh __FUNCTION__, old->handle)); 777903b705cfSriastradh bo = buffer_alloc_with_data(num_pages(old)); 778003b705cfSriastradh if (bo == NULL) 778103b705cfSriastradh return NULL; 778203b705cfSriastradh 778303b705cfSriastradh init_buffer_from_bo(bo, old); 778403b705cfSriastradh bo->need_io = flags & KGEM_BUFFER_WRITE; 778503b705cfSriastradh } else { 778603b705cfSriastradh unsigned hint; 778703b705cfSriastradh 778803b705cfSriastradh if (use_snoopable_buffer(kgem, flags)) { 778903b705cfSriastradh bo = create_snoopable_buffer(kgem, alloc); 779003b705cfSriastradh if (bo) 779103b705cfSriastradh goto init; 779203b705cfSriastradh } 779303b705cfSriastradh 779403b705cfSriastradh bo = buffer_alloc(); 779503b705cfSriastradh if (bo == NULL) 779603b705cfSriastradh return NULL; 779703b705cfSriastradh 779803b705cfSriastradh hint = CREATE_INACTIVE; 779903b705cfSriastradh if (flags & KGEM_BUFFER_WRITE) 780003b705cfSriastradh hint |= CREATE_CPU_MAP; 780103b705cfSriastradh old = search_linear_cache(kgem, alloc, hint); 780203b705cfSriastradh if (old) { 780303b705cfSriastradh DBG(("%s: reusing handle=%d for buffer\n", 780403b705cfSriastradh __FUNCTION__, old->handle)); 780503b705cfSriastradh 780603b705cfSriastradh init_buffer_from_bo(bo, old); 780703b705cfSriastradh } else { 
780803b705cfSriastradh uint32_t handle = gem_create(kgem->fd, alloc); 780903b705cfSriastradh if (handle == 0) { 781003b705cfSriastradh free(bo); 781103b705cfSriastradh return NULL; 781203b705cfSriastradh } 781303b705cfSriastradh 781403b705cfSriastradh DBG(("%s: created handle=%d for buffer\n", 781503b705cfSriastradh __FUNCTION__, handle)); 781603b705cfSriastradh 781703b705cfSriastradh __kgem_bo_init(&bo->base, handle, alloc); 78189a906b70Schristos debug_alloc__bo(kgem, &bo->base); 781903b705cfSriastradh } 782003b705cfSriastradh 782103b705cfSriastradh assert(bo->mmapped); 782203b705cfSriastradh assert(!bo->need_io); 782303b705cfSriastradh assert(bo->base.refcnt == 1); 782403b705cfSriastradh 782503b705cfSriastradh if (flags & KGEM_BUFFER_WRITE) { 782603b705cfSriastradh bo->mem = kgem_bo_map__cpu(kgem, &bo->base); 782703b705cfSriastradh if (bo->mem != NULL) { 782803b705cfSriastradh kgem_bo_sync__cpu(kgem, &bo->base); 782903b705cfSriastradh goto init; 783003b705cfSriastradh } 783103b705cfSriastradh } 783203b705cfSriastradh 783303b705cfSriastradh DBG(("%s: failing back to new pwrite buffer\n", __FUNCTION__)); 783403b705cfSriastradh old = &bo->base; 783503b705cfSriastradh bo = buffer_alloc_with_data(num_pages(old)); 783603b705cfSriastradh if (bo == NULL) { 783703b705cfSriastradh old->refcnt= 0; 783803b705cfSriastradh kgem_bo_free(kgem, old); 783903b705cfSriastradh return NULL; 784003b705cfSriastradh } 784103b705cfSriastradh 784203b705cfSriastradh init_buffer_from_bo(bo, old); 784303b705cfSriastradh 784403b705cfSriastradh assert(bo->mem); 784503b705cfSriastradh assert(!bo->mmapped); 784603b705cfSriastradh assert(bo->base.refcnt == 1); 784703b705cfSriastradh 784803b705cfSriastradh bo->need_io = flags & KGEM_BUFFER_WRITE; 784903b705cfSriastradh } 785003b705cfSriastradhinit: 785103b705cfSriastradh bo->base.io = true; 785203b705cfSriastradh assert(bo->base.refcnt == 1); 785303b705cfSriastradh assert(num_pages(&bo->base) >= NUM_PAGES(size)); 785403b705cfSriastradh 
assert(!bo->need_io || !bo->base.needs_flush); 785503b705cfSriastradh assert(!bo->need_io || bo->base.domain != DOMAIN_GPU); 785603b705cfSriastradh assert(bo->mem); 7857813957e3Ssnj assert(bo->mmapped != MMAPPED_GTT || bo->base.map__gtt == bo->mem || bo->base.map__wc == bo->mem); 78589a906b70Schristos assert(bo->mmapped != MMAPPED_CPU || MAP(bo->base.map__cpu) == bo->mem); 785903b705cfSriastradh 786003b705cfSriastradh bo->used = size; 786103b705cfSriastradh bo->write = flags & KGEM_BUFFER_WRITE_INPLACE; 786203b705cfSriastradh offset = 0; 786303b705cfSriastradh 786403b705cfSriastradh assert(list_is_empty(&bo->base.list)); 786503b705cfSriastradh list_add(&bo->base.list, &kgem->batch_buffers); 786603b705cfSriastradh 786703b705cfSriastradh DBG(("%s(pages=%d [%d]) new handle=%d, used=%d, write=%d\n", 786803b705cfSriastradh __FUNCTION__, num_pages(&bo->base), alloc, bo->base.handle, bo->used, bo->write)); 786903b705cfSriastradh 787003b705cfSriastradhdone: 787103b705cfSriastradh bo->used = ALIGN(bo->used, UPLOAD_ALIGNMENT); 78729a906b70Schristos assert(bo->used && bo->used <= bytes(&bo->base)); 787303b705cfSriastradh assert(bo->mem); 787403b705cfSriastradh *ret = (char *)bo->mem + offset; 787503b705cfSriastradh return kgem_create_proxy(kgem, &bo->base, offset, size); 787603b705cfSriastradh} 787703b705cfSriastradh 787803b705cfSriastradhbool kgem_buffer_is_inplace(struct kgem_bo *_bo) 787903b705cfSriastradh{ 788003b705cfSriastradh struct kgem_buffer *bo = (struct kgem_buffer *)_bo->proxy; 788103b705cfSriastradh return bo->write & KGEM_BUFFER_WRITE_INPLACE; 788203b705cfSriastradh} 788303b705cfSriastradh 788403b705cfSriastradhstruct kgem_bo *kgem_create_buffer_2d(struct kgem *kgem, 788503b705cfSriastradh int width, int height, int bpp, 788603b705cfSriastradh uint32_t flags, 788703b705cfSriastradh void **ret) 788803b705cfSriastradh{ 788903b705cfSriastradh struct kgem_bo *bo; 789003b705cfSriastradh int stride; 789103b705cfSriastradh 789203b705cfSriastradh assert(width > 0 && 
height > 0); 789303b705cfSriastradh assert(ret != NULL); 789403b705cfSriastradh stride = ALIGN(width, 2) * bpp >> 3; 7895813957e3Ssnj stride = ALIGN(stride, kgem->gen >= 0100 ? 32 : 4); 789603b705cfSriastradh 789703b705cfSriastradh DBG(("%s: %dx%d, %d bpp, stride=%d\n", 789803b705cfSriastradh __FUNCTION__, width, height, bpp, stride)); 789903b705cfSriastradh 790003b705cfSriastradh bo = kgem_create_buffer(kgem, stride * ALIGN(height, 2), flags, ret); 790103b705cfSriastradh if (bo == NULL) { 790203b705cfSriastradh DBG(("%s: allocation failure for upload buffer\n", 790303b705cfSriastradh __FUNCTION__)); 790403b705cfSriastradh return NULL; 790503b705cfSriastradh } 790603b705cfSriastradh assert(*ret != NULL); 790703b705cfSriastradh assert(bo->proxy != NULL); 790803b705cfSriastradh 790903b705cfSriastradh if (height & 1) { 791003b705cfSriastradh struct kgem_buffer *io = (struct kgem_buffer *)bo->proxy; 791103b705cfSriastradh int min; 791203b705cfSriastradh 791303b705cfSriastradh assert(io->used); 791403b705cfSriastradh 791503b705cfSriastradh /* Having padded this surface to ensure that accesses to 791603b705cfSriastradh * the last pair of rows is valid, remove the padding so 791703b705cfSriastradh * that it can be allocated to other pixmaps. 
791803b705cfSriastradh */ 791903b705cfSriastradh min = bo->delta + height * stride; 792003b705cfSriastradh min = ALIGN(min, UPLOAD_ALIGNMENT); 792103b705cfSriastradh if (io->used != min) { 792203b705cfSriastradh DBG(("%s: trimming buffer from %d to %d\n", 792303b705cfSriastradh __FUNCTION__, io->used, min)); 792403b705cfSriastradh io->used = min; 792503b705cfSriastradh } 792603b705cfSriastradh bo->size.bytes -= stride; 792703b705cfSriastradh } 792803b705cfSriastradh 79299a906b70Schristos bo->map__cpu = *ret; 793003b705cfSriastradh bo->pitch = stride; 793103b705cfSriastradh bo->unique_id = kgem_get_unique_id(kgem); 793203b705cfSriastradh return bo; 793303b705cfSriastradh} 793403b705cfSriastradh 793503b705cfSriastradhstruct kgem_bo *kgem_upload_source_image(struct kgem *kgem, 793603b705cfSriastradh const void *data, 793703b705cfSriastradh const BoxRec *box, 793803b705cfSriastradh int stride, int bpp) 793903b705cfSriastradh{ 794003b705cfSriastradh int width = box->x2 - box->x1; 794103b705cfSriastradh int height = box->y2 - box->y1; 794203b705cfSriastradh struct kgem_bo *bo; 794303b705cfSriastradh void *dst; 794403b705cfSriastradh 794503b705cfSriastradh if (!kgem_can_create_2d(kgem, width, height, bpp)) 794603b705cfSriastradh return NULL; 794703b705cfSriastradh 794803b705cfSriastradh DBG(("%s : (%d, %d), (%d, %d), stride=%d, bpp=%d\n", 794903b705cfSriastradh __FUNCTION__, box->x1, box->y1, box->x2, box->y2, stride, bpp)); 795003b705cfSriastradh 795103b705cfSriastradh assert(data); 795203b705cfSriastradh assert(width > 0); 795303b705cfSriastradh assert(height > 0); 795403b705cfSriastradh assert(stride); 795503b705cfSriastradh assert(bpp); 795603b705cfSriastradh 795703b705cfSriastradh bo = kgem_create_buffer_2d(kgem, 795803b705cfSriastradh width, height, bpp, 795903b705cfSriastradh KGEM_BUFFER_WRITE_INPLACE, &dst); 79609a906b70Schristos if (bo == NULL) 79619a906b70Schristos return NULL; 79629a906b70Schristos 79639a906b70Schristos if (sigtrap_get()) { 
79649a906b70Schristos kgem_bo_destroy(kgem, bo); 79659a906b70Schristos return NULL; 79669a906b70Schristos } 79679a906b70Schristos 79689a906b70Schristos memcpy_blt(data, dst, bpp, 79699a906b70Schristos stride, bo->pitch, 79709a906b70Schristos box->x1, box->y1, 79719a906b70Schristos 0, 0, 79729a906b70Schristos width, height); 797303b705cfSriastradh 79749a906b70Schristos sigtrap_put(); 797503b705cfSriastradh return bo; 797603b705cfSriastradh} 797703b705cfSriastradh /* kgem_proxy_bo_attach: bo must be a proxy (bo->proxy set) whose map__gtt is still NULL. Adds bo->vma to the bo->proxy->vma list, stores ptr itself in bo->map__gtt, and writes the result of kgem_bo_reference(bo) to *ptr. NOTE(review): map__gtt holds a struct kgem_bo ** here rather than a mapping - presumably so the slot can be found again when the proxy is released; confirm against the release path. */797803b705cfSriastradhvoid kgem_proxy_bo_attach(struct kgem_bo *bo, 797903b705cfSriastradh struct kgem_bo **ptr) 798003b705cfSriastradh{ 798103b705cfSriastradh DBG(("%s: handle=%d\n", __FUNCTION__, bo->handle)); 79829a906b70Schristos assert(bo->map__gtt == NULL); 798303b705cfSriastradh assert(bo->proxy); 798403b705cfSriastradh list_add(&bo->vma, &bo->proxy->vma); 79859a906b70Schristos bo->map__gtt = ptr; 798603b705cfSriastradh *ptr = kgem_bo_reference(bo); 798703b705cfSriastradh} 798803b705cfSriastradh /* kgem_buffer_read_sync: synchronise the buffer behind the proxy _bo before it is read. _bo must be an io proxy with exec == NULL and rq == NULL; offset and length are taken from the proxy (delta, size.bytes) and the work is done on its parent. A mapped parent gets a SET_DOMAIN ioctl with no write domain, an unmapped one is read into bo->mem with gem_read(). Afterwards the parent is passed to kgem_bo_maybe_retire() and its domain set to DOMAIN_NONE, except that a non-zero gem_read() result returns early and skips both. */798903b705cfSriastradhvoid kgem_buffer_read_sync(struct kgem *kgem, struct kgem_bo *_bo) 799003b705cfSriastradh{ 799103b705cfSriastradh struct kgem_buffer *bo; 799203b705cfSriastradh uint32_t offset = _bo->delta, length = _bo->size.bytes; 799303b705cfSriastradh 799403b705cfSriastradh /* We expect the caller to have already submitted the batch */ 799503b705cfSriastradh assert(_bo->io); 799603b705cfSriastradh assert(_bo->exec == NULL); 799703b705cfSriastradh assert(_bo->rq == NULL); 799803b705cfSriastradh assert(_bo->proxy); 799903b705cfSriastradh 800003b705cfSriastradh _bo = _bo->proxy; /* from here on _bo is the parent; offset/length above were read from the proxy */800103b705cfSriastradh assert(_bo->proxy == NULL); 800203b705cfSriastradh assert(_bo->exec == NULL); 800303b705cfSriastradh 800403b705cfSriastradh bo = (struct kgem_buffer *)_bo; 800503b705cfSriastradh 800603b705cfSriastradh DBG(("%s(offset=%d, length=%d, snooped=%d)\n", __FUNCTION__, 800703b705cfSriastradh offset, length, bo->base.snoop)); 800803b705cfSriastradh 800903b705cfSriastradh if (bo->mmapped) { 801003b705cfSriastradh 
struct drm_i915_gem_set_domain set_domain; 801103b705cfSriastradh 801203b705cfSriastradh DBG(("%s: sync: needs_flush? %d, domain? %d, busy? %d\n", 801303b705cfSriastradh __FUNCTION__, 801403b705cfSriastradh bo->base.needs_flush, 801503b705cfSriastradh bo->base.domain, 801603b705cfSriastradh __kgem_busy(kgem, bo->base.handle))); 801703b705cfSriastradh 80189a906b70Schristos assert(bo->mmapped == MMAPPED_GTT || bo->base.snoop || kgem->has_llc); 801903b705cfSriastradh 802003b705cfSriastradh VG_CLEAR(set_domain); 802103b705cfSriastradh set_domain.handle = bo->base.handle; /* no write domain is requested; the read domain follows the mapping type (CPU for MMAPPED_CPU, GTT otherwise) */802203b705cfSriastradh set_domain.write_domain = 0; 802303b705cfSriastradh set_domain.read_domains = 80249a906b70Schristos bo->mmapped == MMAPPED_CPU ? I915_GEM_DOMAIN_CPU : I915_GEM_DOMAIN_GTT; 802503b705cfSriastradh /* a non-zero do_ioctl() result is logged as a GPU hang and handed to kgem_throttle(); execution still continues to the retire step below */80269a906b70Schristos if (do_ioctl(kgem->fd, DRM_IOCTL_I915_GEM_SET_DOMAIN, &set_domain)) { 80279a906b70Schristos DBG(("%s: sync: GPU hang detected\n", __FUNCTION__)); 80289a906b70Schristos kgem_throttle(kgem); 80299a906b70Schristos } 803003b705cfSriastradh } else { /* NOTE(review): presumably gem_read(fd, handle, dst, offset, length), i.e. the range is read into the same offset of bo->mem - confirm against gem_read() */803103b705cfSriastradh if (gem_read(kgem->fd, 803203b705cfSriastradh bo->base.handle, (char *)bo->mem+offset, 803303b705cfSriastradh offset, length)) 803403b705cfSriastradh return; 803503b705cfSriastradh } 80369a906b70Schristos kgem_bo_maybe_retire(kgem, &bo->base); 803703b705cfSriastradh bo->base.domain = DOMAIN_NONE; 803803b705cfSriastradh} 803903b705cfSriastradh /* kgem_bo_get_binding: walks the binding list starting at the embedded bo->binding and stops at a NULL link or at the first entry whose offset is 0. Returns the offset of the first entry whose format equals format, or 0 if there is none, so an offset of 0 doubles as "end of valid entries" and "not found". */804003b705cfSriastradhuint32_t kgem_bo_get_binding(struct kgem_bo *bo, uint32_t format) 804103b705cfSriastradh{ 804203b705cfSriastradh struct kgem_bo_binding *b; 804303b705cfSriastradh 80449a906b70Schristos assert(bo->refcnt); 80459a906b70Schristos 804603b705cfSriastradh for (b = &bo->binding; b && b->offset; b = b->next) 804703b705cfSriastradh if (format == b->format) 804803b705cfSriastradh return b->offset; 804903b705cfSriastradh 805003b705cfSriastradh return 0; 805103b705cfSriastradh} 805203b705cfSriastradh /* kgem_bo_set_binding: stores (format, offset) in bo's binding list. The first entry with offset == 0 is reused and, if it has a successor, the successor's offset is zeroed so that the lookup loop in kgem_bo_get_binding() ends there. When every entry is in use a new one is malloc()ed and linked in directly after the embedded head; if malloc() fails nothing is recorded and no error is reported. An offset argument of 0 leaves the entry looking unused. */805303b705cfSriastradhvoid kgem_bo_set_binding(struct 
kgem_bo *bo, uint32_t format, uint16_t offset) 805403b705cfSriastradh{ 805503b705cfSriastradh struct kgem_bo_binding *b; 805603b705cfSriastradh 80579a906b70Schristos assert(bo->refcnt); 80589a906b70Schristos 805903b705cfSriastradh for (b = &bo->binding; b; b = b->next) { 806003b705cfSriastradh if (b->offset) 806103b705cfSriastradh continue; 806203b705cfSriastradh 806303b705cfSriastradh b->offset = offset; 806403b705cfSriastradh b->format = format; 806503b705cfSriastradh /* terminate the valid run after this entry; anything further down the list is no longer reached by the loop in kgem_bo_get_binding() */806603b705cfSriastradh if (b->next) 806703b705cfSriastradh b->next->offset = 0; 806803b705cfSriastradh 806903b705cfSriastradh return; 807003b705cfSriastradh } 807103b705cfSriastradh /* every existing entry has a non-zero offset: add a new one right behind the embedded head */807203b705cfSriastradh b = malloc(sizeof(*b)); 807303b705cfSriastradh if (b) { 807403b705cfSriastradh b->next = bo->binding.next; 807503b705cfSriastradh b->format = format; 807603b705cfSriastradh b->offset = offset; 807703b705cfSriastradh bo->binding.next = b; 807803b705cfSriastradh } 807903b705cfSriastradh} 808003b705cfSriastradh /* kgem_replace_bo: obtains a bo of NUM_PAGES(height * pitch) pages (from search_linear_cache(), else gem_create()), gives it the requested pitch, a fresh unique_id and refcnt 1, and appends an XY_SRC_COPY_BLT command of width x height from src to it in kgem->batch. The command is only queued here; this function does not call kgem_submit() after emitting it. src is asserted to be untiled and blittable. Returns the new bo, or NULL if no bo could be created or the fence check still fails after submitting the current batch (the new bo is destroyed in that case). NOTE(review): height * pitch is a 32-bit multiply with no overflow check - confirm callers keep it in range. */808103b705cfSriastradhstruct kgem_bo * 808203b705cfSriastradhkgem_replace_bo(struct kgem *kgem, 808303b705cfSriastradh struct kgem_bo *src, 808403b705cfSriastradh uint32_t width, 808503b705cfSriastradh uint32_t height, 808603b705cfSriastradh uint32_t pitch, 808703b705cfSriastradh uint32_t bpp) 808803b705cfSriastradh{ 808903b705cfSriastradh struct kgem_bo *dst; 809003b705cfSriastradh uint32_t br00, br13; 809103b705cfSriastradh uint32_t handle; 809203b705cfSriastradh uint32_t size; 809303b705cfSriastradh uint32_t *b; 809403b705cfSriastradh 809503b705cfSriastradh DBG(("%s: replacing bo handle=%d, size=%dx%d pitch=%d, with pitch=%d\n", 809603b705cfSriastradh __FUNCTION__, src->handle, width, height, src->pitch, pitch)); 809703b705cfSriastradh 809803b705cfSriastradh /* We only expect to be called to fixup small buffers, hence why 809903b705cfSriastradh * we only attempt to allocate a linear bo. 
810003b705cfSriastradh */ 810103b705cfSriastradh assert(src->tiling == I915_TILING_NONE); 81029a906b70Schristos assert(kgem_bo_can_blt(kgem, src)); 810303b705cfSriastradh 810403b705cfSriastradh size = height * pitch; 810503b705cfSriastradh size = NUM_PAGES(size); 810603b705cfSriastradh /* size now holds the NUM_PAGES() result; try the cache with flags 0, then CREATE_INACTIVE, before creating a new object */810703b705cfSriastradh dst = search_linear_cache(kgem, size, 0); 810803b705cfSriastradh if (dst == NULL) 810903b705cfSriastradh dst = search_linear_cache(kgem, size, CREATE_INACTIVE); 811003b705cfSriastradh if (dst == NULL) { 811103b705cfSriastradh handle = gem_create(kgem->fd, size); 811203b705cfSriastradh if (handle == 0) 811303b705cfSriastradh return NULL; 811403b705cfSriastradh 811503b705cfSriastradh dst = __kgem_bo_alloc(handle, size); 811603b705cfSriastradh if (dst == NULL) { 811703b705cfSriastradh gem_close(kgem->fd, handle); 811803b705cfSriastradh return NULL; 811903b705cfSriastradh } 812003b705cfSriastradh 812103b705cfSriastradh debug_alloc__bo(kgem, dst); 812203b705cfSriastradh } 812303b705cfSriastradh dst->pitch = pitch; 812403b705cfSriastradh dst->unique_id = kgem_get_unique_id(kgem); 812503b705cfSriastradh dst->refcnt = 1; 81269a906b70Schristos assert(dst->tiling == I915_TILING_NONE); 81279a906b70Schristos assert(kgem_bo_can_blt(kgem, dst)); 812803b705cfSriastradh 812903b705cfSriastradh kgem_set_mode(kgem, KGEM_BLT, dst); /* room for 10 batch dwords (the larger of the two command forms below) and 2 relocations is checked; if any check fails, submit what is queued and re-check only the fence constraint */81309a906b70Schristos if (!kgem_check_batch(kgem, 10) || 813103b705cfSriastradh !kgem_check_reloc(kgem, 2) || 813203b705cfSriastradh !kgem_check_many_bo_fenced(kgem, src, dst, NULL)) { 813303b705cfSriastradh kgem_submit(kgem); 813403b705cfSriastradh if (!kgem_check_many_bo_fenced(kgem, src, dst, NULL)) { 813503b705cfSriastradh kgem_bo_destroy(kgem, dst); 813603b705cfSriastradh return NULL; 813703b705cfSriastradh } 813803b705cfSriastradh _kgem_set_mode(kgem, KGEM_BLT); 813903b705cfSriastradh } 814063ef14f0Smrg kgem_bcs_set_tiling(kgem, src, dst); 814103b705cfSriastradh /* br13 starts out as the pitch argument (the new bo's pitch); the local pitch is then overwritten with src->pitch for the later pitch dword */814203b705cfSriastradh br00 = XY_SRC_COPY_BLT_CMD; 814303b705cfSriastradh br13 = 
pitch; 814403b705cfSriastradh pitch = src->pitch; /* with assertions enabled this branch cannot be taken: src->tiling was asserted to be I915_TILING_NONE above */814503b705cfSriastradh if (kgem->gen >= 040 && src->tiling) { 814603b705cfSriastradh br00 |= BLT_SRC_TILED; 814703b705cfSriastradh pitch >>= 2; 814803b705cfSriastradh } 814903b705cfSriastradh /* NOTE(review): 0xcc is presumably the source-copy raster operation - confirm with the BLT command reference */815003b705cfSriastradh br13 |= 0xcc << 16; 815103b705cfSriastradh switch (bpp) { 815203b705cfSriastradh default: /* any bpp other than 16 or 8 is handled as 32 */815303b705cfSriastradh case 32: br00 |= BLT_WRITE_ALPHA | BLT_WRITE_RGB; 815403b705cfSriastradh br13 |= 1 << 25; /* RGB8888 */ /* fall through: the 32bpp case sets bit 25 and bit 24 */815503b705cfSriastradh case 16: br13 |= 1 << 24; /* RGB565 */ /* fall through */815603b705cfSriastradh case 8: break; 815703b705cfSriastradh } 815803b705cfSriastradh 815903b705cfSriastradh b = kgem->batch + kgem->nbatch; /* gen >= 0100 (octal): 10 dwords with 64-bit relocations stored across b[4..5] and b[8..9]; older gens: 8 dwords with 32-bit relocations in b[4] and b[7]. NOTE(review): the 8 / 6 OR-ed into b[0] is presumably the command length field (dwords - 2) - confirm with the BLT command reference */81609a906b70Schristos if (kgem->gen >= 0100) { 81619a906b70Schristos b[0] = br00 | 8; 81629a906b70Schristos b[1] = br13; 81639a906b70Schristos b[2] = 0; 81649a906b70Schristos b[3] = height << 16 | width; /* the dst relocation also sets the low-half RENDER domain that the src relocation omits - presumably the write domain; confirm against kgem_add_reloc64() */81659a906b70Schristos *(uint64_t *)(b+4) = 81669a906b70Schristos kgem_add_reloc64(kgem, kgem->nbatch + 4, dst, 81679a906b70Schristos I915_GEM_DOMAIN_RENDER << 16 | 81689a906b70Schristos I915_GEM_DOMAIN_RENDER | 81699a906b70Schristos KGEM_RELOC_FENCED, 81709a906b70Schristos 0); 81719a906b70Schristos b[6] = 0; 81729a906b70Schristos b[7] = pitch; 81739a906b70Schristos *(uint64_t *)(b+8) = 81749a906b70Schristos kgem_add_reloc64(kgem, kgem->nbatch + 8, src, 81759a906b70Schristos I915_GEM_DOMAIN_RENDER << 16 | 81769a906b70Schristos KGEM_RELOC_FENCED, 81779a906b70Schristos 0); 81789a906b70Schristos kgem->nbatch += 10; 81799a906b70Schristos } else { 81809a906b70Schristos b[0] = br00 | 6; 81819a906b70Schristos b[1] = br13; 81829a906b70Schristos b[2] = 0; 81839a906b70Schristos b[3] = height << 16 | width; 81849a906b70Schristos b[4] = kgem_add_reloc(kgem, kgem->nbatch + 4, dst, 81859a906b70Schristos I915_GEM_DOMAIN_RENDER << 16 | 81869a906b70Schristos I915_GEM_DOMAIN_RENDER | 81879a906b70Schristos KGEM_RELOC_FENCED, 81889a906b70Schristos 0); 81899a906b70Schristos b[5] = 0; 81909a906b70Schristos b[6] = 
pitch; 81919a906b70Schristos b[7] = kgem_add_reloc(kgem, kgem->nbatch + 7, src, 81929a906b70Schristos I915_GEM_DOMAIN_RENDER << 16 | 81939a906b70Schristos KGEM_RELOC_FENCED, 81949a906b70Schristos 0); 81959a906b70Schristos kgem->nbatch += 8; 81969a906b70Schristos } 819703b705cfSriastradh 819803b705cfSriastradh return dst; 819903b705cfSriastradh} 82009a906b70Schristos /* kgem_bo_convert_to_gpu: decides whether an untiled bo can be converted from CPU to GPU use, making it UNCACHED when needed. Checks run in this order: false if flags contain __MOVE_PRIME or __MOVE_SCANOUT; true if kgem->has_llc (nothing is changed); false if MOVE_ASYNC_HINT is set and the bo is busy. Otherwise the bo is asserted to be snooped, kgem_bo_submit() is called, and gem_set_caching(..., UNCACHED) is attempted: false if that fails, else bo->snoop is cleared and true is returned. */82019a906b70Schristosbool kgem_bo_convert_to_gpu(struct kgem *kgem, 82029a906b70Schristos struct kgem_bo *bo, 82039a906b70Schristos unsigned flags) 82049a906b70Schristos{ 8205813957e3Ssnj DBG(("%s: converting handle=%d from CPU to GPU, flags=%x, busy?=%d\n", 8206813957e3Ssnj __FUNCTION__, bo->handle, flags, __kgem_bo_is_busy(kgem, bo))); 82079a906b70Schristos assert(bo->tiling == I915_TILING_NONE); 82089a906b70Schristos 820963ef14f0Smrg if (flags & (__MOVE_PRIME | __MOVE_SCANOUT)) 821063ef14f0Smrg return false; 821163ef14f0Smrg 82129a906b70Schristos if (kgem->has_llc) 82139a906b70Schristos return true; 82149a906b70Schristos /* & binds tighter than &&, so this reads (flags & MOVE_ASYNC_HINT) && busy */82159a906b70Schristos if (flags & MOVE_ASYNC_HINT && __kgem_bo_is_busy(kgem, bo)) 82169a906b70Schristos return false; 82179a906b70Schristos 82189a906b70Schristos assert(bo->snoop); 82199a906b70Schristos 82209a906b70Schristos kgem_bo_submit(kgem, bo); 82219a906b70Schristos 82229a906b70Schristos if (!gem_set_caching(kgem->fd, bo->handle, UNCACHED)) 82239a906b70Schristos return false; 82249a906b70Schristos 82259a906b70Schristos bo->snoop = false; 82269a906b70Schristos return true; 82279a906b70Schristos} 8228