1 /* $NetBSD: radeon_sync.c,v 1.3 2021/12/18 23:45:43 riastradh Exp $ */ 2 3 /* 4 * Copyright 2014 Advanced Micro Devices, Inc. 5 * All Rights Reserved. 6 * 7 * Permission is hereby granted, free of charge, to any person obtaining a 8 * copy of this software and associated documentation files (the 9 * "Software"), to deal in the Software without restriction, including 10 * without limitation the rights to use, copy, modify, merge, publish, 11 * distribute, sub license, and/or sell copies of the Software, and to 12 * permit persons to whom the Software is furnished to do so, subject to 13 * the following conditions: 14 * 15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL 18 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, 19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR 20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE 21 * USE OR OTHER DEALINGS IN THE SOFTWARE. 22 * 23 * The above copyright notice and this permission notice (including the 24 * next paragraph) shall be included in all copies or substantial portions 25 * of the Software. 26 * 27 */ 28 /* 29 * Authors: 30 * Christian Knig <christian.koenig (at) amd.com> 31 */ 32 33 #include <sys/cdefs.h> 34 __KERNEL_RCSID(0, "$NetBSD: radeon_sync.c,v 1.3 2021/12/18 23:45:43 riastradh Exp $"); 35 36 #include "radeon.h" 37 #include "radeon_trace.h" 38 39 /** 40 * radeon_sync_create - zero init sync object 41 * 42 * @sync: sync object to initialize 43 * 44 * Just clear the sync object for now. 45 */ 46 void radeon_sync_create(struct radeon_sync *sync) 47 { 48 unsigned i; 49 50 for (i = 0; i < RADEON_NUM_SYNCS; ++i) 51 sync->semaphores[i] = NULL; 52 53 for (i = 0; i < RADEON_NUM_RINGS; ++i) 54 sync->sync_to[i] = NULL; 55 56 sync->last_vm_update = NULL; 57 } 58 59 /** 60 * radeon_sync_fence - use the semaphore to sync to a fence 61 * 62 * @sync: sync object to add fence to 63 * @fence: fence to sync to 64 * 65 * Sync to the fence using the semaphore objects 66 */ 67 void radeon_sync_fence(struct radeon_sync *sync, 68 struct radeon_fence *fence) 69 { 70 struct radeon_fence *other; 71 72 if (!fence) 73 return; 74 75 other = sync->sync_to[fence->ring]; 76 sync->sync_to[fence->ring] = radeon_fence_later(fence, other); 77 78 if (fence->is_vm_update) { 79 other = sync->last_vm_update; 80 sync->last_vm_update = radeon_fence_later(fence, other); 81 } 82 } 83 84 /** 85 * radeon_sync_resv - use the semaphores to sync to a reservation object 86 * 87 * @sync: sync object to add fences from reservation object to 88 * @resv: reservation object with embedded fence 89 * @shared: true if we should only sync to the exclusive fence 90 * 91 * Sync to the fence using the semaphore objects 92 */ 93 int radeon_sync_resv(struct radeon_device *rdev, 94 struct radeon_sync *sync, 95 struct dma_resv *resv, 96 bool shared) 97 { 98 struct dma_resv_list *flist; 99 struct dma_fence *f; 100 struct radeon_fence *fence; 101 unsigned i; 102 int r = 0; 103 104 /* always sync to the exclusive fence */ 105 f = dma_resv_get_excl(resv); 106 fence = f ? to_radeon_fence(f) : NULL; 107 if (fence && fence->rdev == rdev) 108 radeon_sync_fence(sync, fence); 109 else if (f) 110 r = dma_fence_wait(f, true); 111 112 flist = dma_resv_get_list(resv); 113 if (shared || !flist || r) 114 return r; 115 116 for (i = 0; i < flist->shared_count; ++i) { 117 f = rcu_dereference_protected(flist->shared[i], 118 dma_resv_held(resv)); 119 fence = to_radeon_fence(f); 120 if (fence && fence->rdev == rdev) 121 radeon_sync_fence(sync, fence); 122 else 123 r = dma_fence_wait(f, true); 124 125 if (r) 126 break; 127 } 128 return r; 129 } 130 131 /** 132 * radeon_sync_rings - sync ring to all registered fences 133 * 134 * @rdev: radeon_device pointer 135 * @sync: sync object to use 136 * @ring: ring that needs sync 137 * 138 * Ensure that all registered fences are signaled before letting 139 * the ring continue. The caller must hold the ring lock. 140 */ 141 int radeon_sync_rings(struct radeon_device *rdev, 142 struct radeon_sync *sync, 143 int ring) 144 { 145 unsigned count = 0; 146 int i, r; 147 148 for (i = 0; i < RADEON_NUM_RINGS; ++i) { 149 struct radeon_fence *fence = sync->sync_to[i]; 150 struct radeon_semaphore *semaphore; 151 152 /* check if we really need to sync */ 153 if (!radeon_fence_need_sync(fence, ring)) 154 continue; 155 156 /* prevent GPU deadlocks */ 157 if (!rdev->ring[i].ready) { 158 dev_err(rdev->dev, "Syncing to a disabled ring!"); 159 return -EINVAL; 160 } 161 162 if (count >= RADEON_NUM_SYNCS) { 163 /* not enough room, wait manually */ 164 r = radeon_fence_wait(fence, false); 165 if (r) 166 return r; 167 continue; 168 } 169 r = radeon_semaphore_create(rdev, &semaphore); 170 if (r) 171 return r; 172 173 sync->semaphores[count++] = semaphore; 174 175 /* allocate enough space for sync command */ 176 r = radeon_ring_alloc(rdev, &rdev->ring[i], 16); 177 if (r) 178 return r; 179 180 /* emit the signal semaphore */ 181 if (!radeon_semaphore_emit_signal(rdev, i, semaphore)) { 182 /* signaling wasn't successful wait manually */ 183 radeon_ring_undo(&rdev->ring[i]); 184 r = radeon_fence_wait(fence, false); 185 if (r) 186 return r; 187 continue; 188 } 189 190 /* we assume caller has already allocated space on waiters ring */ 191 if (!radeon_semaphore_emit_wait(rdev, ring, semaphore)) { 192 /* waiting wasn't successful wait manually */ 193 radeon_ring_undo(&rdev->ring[i]); 194 r = radeon_fence_wait(fence, false); 195 if (r) 196 return r; 197 continue; 198 } 199 200 radeon_ring_commit(rdev, &rdev->ring[i], false); 201 radeon_fence_note_sync(fence, ring); 202 } 203 204 return 0; 205 } 206 207 /** 208 * radeon_sync_free - free the sync object 209 * 210 * @rdev: radeon_device pointer 211 * @sync: sync object to use 212 * @fence: fence to use for the free 213 * 214 * Free the sync object by freeing all semaphores in it. 215 */ 216 void radeon_sync_free(struct radeon_device *rdev, 217 struct radeon_sync *sync, 218 struct radeon_fence *fence) 219 { 220 unsigned i; 221 222 for (i = 0; i < RADEON_NUM_SYNCS; ++i) 223 radeon_semaphore_free(rdev, &sync->semaphores[i], fence); 224 } 225