1 /* 2 * Copyright 2014 Advanced Micro Devices, Inc. 3 * All Rights Reserved. 4 * 5 * Permission is hereby granted, free of charge, to any person obtaining a 6 * copy of this software and associated documentation files (the 7 * "Software"), to deal in the Software without restriction, including 8 * without limitation the rights to use, copy, modify, merge, publish, 9 * distribute, sub license, and/or sell copies of the Software, and to 10 * permit persons to whom the Software is furnished to do so, subject to 11 * the following conditions: 12 * 13 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 14 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 15 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL 16 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, 17 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR 18 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE 19 * USE OR OTHER DEALINGS IN THE SOFTWARE. 20 * 21 * The above copyright notice and this permission notice (including the 22 * next paragraph) shall be included in all copies or substantial portions 23 * of the Software. 24 * 25 */ 26 /* 27 * Authors: 28 * Christian König <christian.koenig@amd.com> 29 */ 30 31 #include "radeon.h" 32 #include "radeon_trace.h" 33 34 /** 35 * radeon_sync_create - zero init sync object 36 * 37 * @sync: sync object to initialize 38 * 39 * Just clear the sync object for now. 40 */ 41 void radeon_sync_create(struct radeon_sync *sync) 42 { 43 unsigned i; 44 45 for (i = 0; i < RADEON_NUM_SYNCS; ++i) 46 sync->semaphores[i] = NULL; 47 48 for (i = 0; i < RADEON_NUM_RINGS; ++i) 49 sync->sync_to[i] = NULL; 50 51 sync->last_vm_update = NULL; 52 } 53 54 /** 55 * radeon_sync_fence - use the semaphore to sync to a fence 56 * 57 * @sync: sync object to add fence to 58 * @fence: fence to sync to 59 * 60 * Sync to the fence using the semaphore objects 61 */ 62 void radeon_sync_fence(struct radeon_sync *sync, 63 struct radeon_fence *fence) 64 { 65 struct radeon_fence *other; 66 67 if (!fence) 68 return; 69 70 other = sync->sync_to[fence->ring]; 71 sync->sync_to[fence->ring] = radeon_fence_later(fence, other); 72 73 if (fence->is_vm_update) { 74 other = sync->last_vm_update; 75 sync->last_vm_update = radeon_fence_later(fence, other); 76 } 77 } 78 79 /** 80 * radeon_sync_resv - use the semaphores to sync to a reservation object 81 * 82 * @rdev: radeon_device pointer 83 * @sync: sync object to add fences from reservation object to 84 * @resv: reservation object with embedded fence 85 * @shared: true if we should only sync to the exclusive fence 86 * 87 * Sync to the fence using the semaphore objects 88 */ 89 int radeon_sync_resv(struct radeon_device *rdev, 90 struct radeon_sync *sync, 91 struct dma_resv *resv, 92 bool shared) 93 { 94 struct dma_resv_list *flist; 95 struct dma_fence *f; 96 struct radeon_fence *fence; 97 unsigned i; 98 int r = 0; 99 100 /* always sync to the exclusive fence */ 101 f = dma_resv_get_excl(resv); 102 fence = f ? to_radeon_fence(f) : NULL; 103 if (fence && fence->rdev == rdev) 104 radeon_sync_fence(sync, fence); 105 else if (f) 106 r = dma_fence_wait(f, true); 107 108 flist = dma_resv_get_list(resv); 109 if (shared || !flist || r) 110 return r; 111 112 for (i = 0; i < flist->shared_count; ++i) { 113 f = rcu_dereference_protected(flist->shared[i], 114 dma_resv_held(resv)); 115 fence = to_radeon_fence(f); 116 if (fence && fence->rdev == rdev) 117 radeon_sync_fence(sync, fence); 118 else 119 r = dma_fence_wait(f, true); 120 121 if (r) 122 break; 123 } 124 return r; 125 } 126 127 /** 128 * radeon_sync_rings - sync ring to all registered fences 129 * 130 * @rdev: radeon_device pointer 131 * @sync: sync object to use 132 * @ring: ring that needs sync 133 * 134 * Ensure that all registered fences are signaled before letting 135 * the ring continue. The caller must hold the ring lock. 136 */ 137 int radeon_sync_rings(struct radeon_device *rdev, 138 struct radeon_sync *sync, 139 int ring) 140 { 141 unsigned count = 0; 142 int i, r; 143 144 for (i = 0; i < RADEON_NUM_RINGS; ++i) { 145 struct radeon_fence *fence = sync->sync_to[i]; 146 struct radeon_semaphore *semaphore; 147 148 /* check if we really need to sync */ 149 if (!radeon_fence_need_sync(fence, ring)) 150 continue; 151 152 /* prevent GPU deadlocks */ 153 if (!rdev->ring[i].ready) { 154 dev_err(rdev->dev, "Syncing to a disabled ring!"); 155 return -EINVAL; 156 } 157 158 if (count >= RADEON_NUM_SYNCS) { 159 /* not enough room, wait manually */ 160 r = radeon_fence_wait(fence, false); 161 if (r) 162 return r; 163 continue; 164 } 165 r = radeon_semaphore_create(rdev, &semaphore); 166 if (r) 167 return r; 168 169 sync->semaphores[count++] = semaphore; 170 171 /* allocate enough space for sync command */ 172 r = radeon_ring_alloc(rdev, &rdev->ring[i], 16); 173 if (r) 174 return r; 175 176 /* emit the signal semaphore */ 177 if (!radeon_semaphore_emit_signal(rdev, i, semaphore)) { 178 /* signaling wasn't successful wait manually */ 179 radeon_ring_undo(&rdev->ring[i]); 180 r = radeon_fence_wait(fence, false); 181 if (r) 182 return r; 183 continue; 184 } 185 186 /* we assume caller has already allocated space on waiters ring */ 187 if (!radeon_semaphore_emit_wait(rdev, ring, semaphore)) { 188 /* waiting wasn't successful wait manually */ 189 radeon_ring_undo(&rdev->ring[i]); 190 r = radeon_fence_wait(fence, false); 191 if (r) 192 return r; 193 continue; 194 } 195 196 radeon_ring_commit(rdev, &rdev->ring[i], false); 197 radeon_fence_note_sync(fence, ring); 198 } 199 200 return 0; 201 } 202 203 /** 204 * radeon_sync_free - free the sync object 205 * 206 * @rdev: radeon_device pointer 207 * @sync: sync object to use 208 * @fence: fence to use for the free 209 * 210 * Free the sync object by freeing all semaphores in it. 211 */ 212 void radeon_sync_free(struct radeon_device *rdev, 213 struct radeon_sync *sync, 214 struct radeon_fence *fence) 215 { 216 unsigned i; 217 218 for (i = 0; i < RADEON_NUM_SYNCS; ++i) 219 radeon_semaphore_free(rdev, &sync->semaphores[i], fence); 220 } 221