1/* 2 * Copyright © 2008-2012 Intel Corporation 3 * 4 * Permission is hereby granted, free of charge, to any person obtaining a 5 * copy of this software and associated documentation files (the "Software"), 6 * to deal in the Software without restriction, including without limitation 7 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8 * and/or sell copies of the Software, and to permit persons to whom the 9 * Software is furnished to do so, subject to the following conditions: 10 * 11 * The above copyright notice and this permission notice (including the next 12 * paragraph) shall be included in all copies or substantial portions of the 13 * Software. 14 * 15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING 20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS 21 * IN THE SOFTWARE. 22 * 23 * Authors: 24 * Eric Anholt <eric@anholt.net> 25 * 26 */ 27 28/** 29 * @file brw_bufmgr.h 30 * 31 * Public definitions of Intel-specific bufmgr functions. 32 */ 33 34#ifndef BRW_BUFMGR_H 35#define BRW_BUFMGR_H 36 37#include <stdbool.h> 38#include <stdint.h> 39#include <stdio.h> 40#include <time.h> 41 42#include "c11/threads.h" 43#include "util/u_atomic.h" 44#include "util/list.h" 45 46#if defined(__cplusplus) 47extern "C" { 48#endif 49 50struct intel_device_info; 51struct brw_context; 52 53/** 54 * Memory zones. When allocating a buffer, you can request that it is 55 * placed into a specific region of the virtual address space (PPGTT). 56 * 57 * Most buffers can go anywhere (BRW_MEMZONE_OTHER). Some buffers are 58 * accessed via an offset from a base address. STATE_BASE_ADDRESS has 59 * a maximum 4GB size for each region, so we need to restrict those 60 * buffers to be within 4GB of the base. Each memory zone corresponds 61 * to a particular base address. 62 * 63 * Currently, i965 partitions the address space into two regions: 64 * 65 * - Low 4GB 66 * - Full 48-bit address space 67 * 68 * Eventually, we hope to carve out 4GB of VMA for each base address. 69 */ 70enum brw_memory_zone { 71 BRW_MEMZONE_LOW_4G, 72 BRW_MEMZONE_OTHER, 73 74 /* Shaders - Instruction State Base Address */ 75 BRW_MEMZONE_SHADER = BRW_MEMZONE_LOW_4G, 76 77 /* Scratch - General State Base Address */ 78 BRW_MEMZONE_SCRATCH = BRW_MEMZONE_LOW_4G, 79 80 /* Surface State Base Address */ 81 BRW_MEMZONE_SURFACE = BRW_MEMZONE_LOW_4G, 82 83 /* Dynamic State Base Address */ 84 BRW_MEMZONE_DYNAMIC = BRW_MEMZONE_LOW_4G, 85}; 86 87#define BRW_MEMZONE_COUNT (BRW_MEMZONE_OTHER + 1) 88 89struct brw_bo { 90 /** 91 * Size in bytes of the buffer object. 92 * 93 * The size may be larger than the size originally requested for the 94 * allocation, such as being aligned to page size. 95 */ 96 uint64_t size; 97 98 /** Buffer manager context associated with this buffer object */ 99 struct brw_bufmgr *bufmgr; 100 101 /** The GEM handle for this buffer object. */ 102 uint32_t gem_handle; 103 104 /** 105 * Offset of the buffer inside the Graphics Translation Table. 106 * 107 * This is effectively our GPU address for the buffer and we use it 108 * as our base for all state pointers into the buffer. However, since the 109 * kernel may be forced to move it around during the course of the 110 * buffer's lifetime, we can only know where the buffer was on the last 111 * execbuf. We presume, and are usually right, that the buffer will not 112 * move and so we use that last offset for the next batch and by doing 113 * so we can avoid having the kernel perform a relocation fixup pass as 114 * our pointers inside the batch will be using the correct base offset. 115 * 116 * Since we do use it as a base address for the next batch of pointers, 117 * the kernel treats our offset as a request, and if possible will 118 * arrange the buffer to placed at that address (trying to balance 119 * the cost of buffer migration versus the cost of performing 120 * relocations). Furthermore, we can force the kernel to place the buffer, 121 * or report a failure if we specified a conflicting offset, at our chosen 122 * offset by specifying EXEC_OBJECT_PINNED. 123 * 124 * Note the GTT may be either per context, or shared globally across the 125 * system. On a shared system, our buffers have to contend for address 126 * space with both aperture mappings and framebuffers and so are more 127 * likely to be moved. On a full ppGTT system, each batch exists in its 128 * own GTT, and so each buffer may have their own offset within each 129 * context. 130 */ 131 uint64_t gtt_offset; 132 133 /** 134 * The validation list index for this buffer, or -1 when not in a batch. 135 * Note that a single buffer may be in multiple batches (contexts), and 136 * this is a global field, which refers to the last batch using the BO. 137 * It should not be considered authoritative, but can be used to avoid a 138 * linear walk of the validation list in the common case by guessing that 139 * exec_bos[bo->index] == bo and confirming whether that's the case. 140 */ 141 unsigned index; 142 143 /** 144 * Boolean of whether the GPU is definitely not accessing the buffer. 145 * 146 * This is only valid when reusable, since non-reusable 147 * buffers are those that have been shared with other 148 * processes, so we don't know their state. 149 */ 150 bool idle; 151 152 int refcount; 153 const char *name; 154 155 uint64_t kflags; 156 157 /** 158 * Kenel-assigned global name for this object 159 * 160 * List contains both flink named and prime fd'd objects 161 */ 162 unsigned int global_name; 163 164 /** 165 * Current tiling mode 166 */ 167 uint32_t tiling_mode; 168 uint32_t swizzle_mode; 169 uint32_t stride; 170 171 time_t free_time; 172 173 /** Mapped address for the buffer, saved across map/unmap cycles */ 174 void *map_cpu; 175 /** GTT virtual address for the buffer, saved across map/unmap cycles */ 176 void *map_gtt; 177 /** WC CPU address for the buffer, saved across map/unmap cycles */ 178 void *map_wc; 179 180 /** BO cache list */ 181 struct list_head head; 182 183 /** 184 * List of GEM handle exports of this buffer (bo_export). 185 * 186 * Hold bufmgr->lock when using this list. 187 */ 188 struct list_head exports; 189 190 /** 191 * Boolean of whether this buffer can be re-used 192 */ 193 bool reusable; 194 195 /** 196 * Boolean of whether this buffer has been shared with an external client. 197 */ 198 bool external; 199 200 /** 201 * Boolean of whether this buffer is cache coherent 202 */ 203 bool cache_coherent; 204}; 205 206#define BO_ALLOC_BUSY (1<<0) 207#define BO_ALLOC_ZEROED (1<<1) 208 209/** 210 * Allocate a buffer object. 211 * 212 * Buffer objects are not necessarily initially mapped into CPU virtual 213 * address space or graphics device aperture. They must be mapped 214 * using brw_bo_map() to be used by the CPU. 215 */ 216struct brw_bo *brw_bo_alloc(struct brw_bufmgr *bufmgr, const char *name, 217 uint64_t size, enum brw_memory_zone memzone); 218 219/** 220 * Allocate a tiled buffer object. 221 * 222 * Alignment for tiled objects is set automatically; the 'flags' 223 * argument provides a hint about how the object will be used initially. 224 * 225 * Valid tiling formats are: 226 * I915_TILING_NONE 227 * I915_TILING_X 228 * I915_TILING_Y 229 */ 230struct brw_bo *brw_bo_alloc_tiled(struct brw_bufmgr *bufmgr, 231 const char *name, 232 uint64_t size, 233 enum brw_memory_zone memzone, 234 uint32_t tiling_mode, 235 uint32_t pitch, 236 unsigned flags); 237 238/** 239 * Allocate a tiled buffer object. 240 * 241 * Alignment for tiled objects is set automatically; the 'flags' 242 * argument provides a hint about how the object will be used initially. 243 * 244 * Valid tiling formats are: 245 * I915_TILING_NONE 246 * I915_TILING_X 247 * I915_TILING_Y 248 * 249 * Note the tiling format may be rejected; callers should check the 250 * 'tiling_mode' field on return, as well as the pitch value, which 251 * may have been rounded up to accommodate for tiling restrictions. 252 */ 253struct brw_bo *brw_bo_alloc_tiled_2d(struct brw_bufmgr *bufmgr, 254 const char *name, 255 int x, int y, int cpp, 256 enum brw_memory_zone memzone, 257 uint32_t tiling_mode, 258 uint32_t *pitch, 259 unsigned flags); 260 261/** Takes a reference on a buffer object */ 262static inline void 263brw_bo_reference(struct brw_bo *bo) 264{ 265 p_atomic_inc(&bo->refcount); 266} 267 268/** 269 * Releases a reference on a buffer object, freeing the data if 270 * no references remain. 271 */ 272void brw_bo_unreference(struct brw_bo *bo); 273 274/* Must match MapBufferRange interface (for convenience) */ 275#define MAP_READ GL_MAP_READ_BIT 276#define MAP_WRITE GL_MAP_WRITE_BIT 277#define MAP_ASYNC GL_MAP_UNSYNCHRONIZED_BIT 278#define MAP_PERSISTENT GL_MAP_PERSISTENT_BIT 279#define MAP_COHERENT GL_MAP_COHERENT_BIT 280/* internal */ 281#define MAP_INTERNAL_MASK (0xffu << 24) 282#define MAP_RAW (0x01 << 24) 283 284/** 285 * Maps the buffer into userspace. 286 * 287 * This function will block waiting for any existing execution on the 288 * buffer to complete, first. The resulting mapping is returned. 289 */ 290MUST_CHECK void *brw_bo_map(struct brw_context *brw, struct brw_bo *bo, unsigned flags); 291 292/** 293 * Reduces the refcount on the userspace mapping of the buffer 294 * object. 295 */ 296static inline int brw_bo_unmap(UNUSED struct brw_bo *bo) { return 0; } 297 298/** Write data into an object. */ 299int brw_bo_subdata(struct brw_bo *bo, uint64_t offset, 300 uint64_t size, const void *data); 301/** 302 * Waits for rendering to an object by the GPU to have completed. 303 * 304 * This is not required for any access to the BO by bo_map, 305 * bo_subdata, etc. It is merely a way for the driver to implement 306 * glFinish. 307 */ 308void brw_bo_wait_rendering(struct brw_bo *bo); 309 310/** 311 * Unref a buffer manager instance. 312 */ 313void brw_bufmgr_unref(struct brw_bufmgr *bufmgr); 314 315/** 316 * Get the current tiling (and resulting swizzling) mode for the bo. 317 * 318 * \param buf Buffer to get tiling mode for 319 * \param tiling_mode returned tiling mode 320 * \param swizzle_mode returned swizzling mode 321 */ 322int brw_bo_get_tiling(struct brw_bo *bo, uint32_t *tiling_mode, 323 uint32_t *swizzle_mode); 324 325/** 326 * Create a visible name for a buffer which can be used by other apps 327 * 328 * \param buf Buffer to create a name for 329 * \param name Returned name 330 */ 331int brw_bo_flink(struct brw_bo *bo, uint32_t *name); 332 333/** 334 * Returns 1 if mapping the buffer for write could cause the process 335 * to block, due to the object being active in the GPU. 336 */ 337int brw_bo_busy(struct brw_bo *bo); 338 339/** 340 * Specify the volatility of the buffer. 341 * \param bo Buffer to create a name for 342 * \param madv The purgeable status 343 * 344 * Use I915_MADV_DONTNEED to mark the buffer as purgeable, and it will be 345 * reclaimed under memory pressure. If you subsequently require the buffer, 346 * then you must pass I915_MADV_WILLNEED to mark the buffer as required. 347 * 348 * Returns 1 if the buffer was retained, or 0 if it was discarded whilst 349 * marked as I915_MADV_DONTNEED. 350 */ 351int brw_bo_madvise(struct brw_bo *bo, int madv); 352 353struct brw_bufmgr *brw_bufmgr_get_for_fd(struct intel_device_info *devinfo, 354 int fd, bool bo_reuse); 355 356struct brw_bo *brw_bo_gem_create_from_name(struct brw_bufmgr *bufmgr, 357 const char *name, 358 unsigned int handle); 359 360int brw_bo_wait(struct brw_bo *bo, int64_t timeout_ns); 361 362uint32_t brw_create_hw_context(struct brw_bufmgr *bufmgr); 363 364int brw_hw_context_set_priority(struct brw_bufmgr *bufmgr, 365 uint32_t ctx_id, 366 int priority); 367 368void brw_destroy_hw_context(struct brw_bufmgr *bufmgr, uint32_t ctx_id); 369 370int brw_bufmgr_get_fd(struct brw_bufmgr *bufmgr); 371 372int brw_bo_gem_export_to_prime(struct brw_bo *bo, int *prime_fd); 373struct brw_bo *brw_bo_gem_create_from_prime(struct brw_bufmgr *bufmgr, 374 int prime_fd); 375struct brw_bo *brw_bo_gem_create_from_prime_tiled(struct brw_bufmgr *bufmgr, 376 int prime_fd, 377 uint32_t tiling_mode, 378 uint32_t stride); 379 380uint32_t brw_bo_export_gem_handle(struct brw_bo *bo); 381 382/** 383 * Exports a bo as a GEM handle into a given DRM file descriptor 384 * \param bo Buffer to export 385 * \param drm_fd File descriptor where the new handle is created 386 * \param out_handle Pointer to store the new handle 387 * 388 * Returns 0 if the buffer was successfully exported, a non zero error code 389 * otherwise. 390 */ 391int brw_bo_export_gem_handle_for_device(struct brw_bo *bo, int drm_fd, 392 uint32_t *out_handle); 393 394int brw_reg_read(struct brw_bufmgr *bufmgr, uint32_t offset, 395 uint64_t *result); 396 397bool brw_using_softpin(struct brw_bufmgr *bufmgr); 398 399/** @{ */ 400 401#if defined(__cplusplus) 402} 403#endif 404#endif /* BRW_BUFMGR_H */ 405