diff options
author | Christian König <christian.koenig@amd.com> | 2014-08-27 09:21:58 -0400 |
---|---|---|
committer | Alex Deucher <alexander.deucher@amd.com> | 2014-08-27 17:42:11 -0400 |
commit | 0bfa4b41268ad5fd741f16f484e4fee190822ec6 (patch) | |
tree | 670093f179cd39a4dcf555a85074235b95bbea99 /drivers/gpu | |
parent | 9bb39ff43e15e85bc1bd9bbbdc5b9cef7a670fd5 (diff) |
drm/radeon: handle lockup in delayed work, v5
v5 (chk): complete rework, start when the first fence is emitted,
stop when the last fence is signalled, make it work
correctly with GPU resets, cleanup radeon_fence_wait_seq
Signed-off-by: Maarten Lankhorst <maarten.lankhorst@canonical.com>
Signed-off-by: Christian König <christian.koenig@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
Diffstat (limited to 'drivers/gpu')
-rw-r--r-- | drivers/gpu/drm/radeon/radeon.h | 2 | ||||
-rw-r--r-- | drivers/gpu/drm/radeon/radeon_fence.c | 200 |
2 files changed, 124 insertions, 78 deletions
diff --git a/drivers/gpu/drm/radeon/radeon.h b/drivers/gpu/drm/radeon/radeon.h index 8cd1b3f60d4a..74919ef57ac3 100644 --- a/drivers/gpu/drm/radeon/radeon.h +++ b/drivers/gpu/drm/radeon/radeon.h | |||
@@ -350,6 +350,7 @@ extern void evergreen_tiling_fields(unsigned tiling_flags, unsigned *bankw, | |||
350 | * Fences. | 350 | * Fences. |
351 | */ | 351 | */ |
352 | struct radeon_fence_driver { | 352 | struct radeon_fence_driver { |
353 | struct radeon_device *rdev; | ||
353 | uint32_t scratch_reg; | 354 | uint32_t scratch_reg; |
354 | uint64_t gpu_addr; | 355 | uint64_t gpu_addr; |
355 | volatile uint32_t *cpu_addr; | 356 | volatile uint32_t *cpu_addr; |
@@ -357,6 +358,7 @@ struct radeon_fence_driver { | |||
357 | uint64_t sync_seq[RADEON_NUM_RINGS]; | 358 | uint64_t sync_seq[RADEON_NUM_RINGS]; |
358 | atomic64_t last_seq; | 359 | atomic64_t last_seq; |
359 | bool initialized; | 360 | bool initialized; |
361 | struct delayed_work lockup_work; | ||
360 | }; | 362 | }; |
361 | 363 | ||
362 | struct radeon_fence { | 364 | struct radeon_fence { |
diff --git a/drivers/gpu/drm/radeon/radeon_fence.c b/drivers/gpu/drm/radeon/radeon_fence.c index e8a28e7b39c7..ac15f3418478 100644 --- a/drivers/gpu/drm/radeon/radeon_fence.c +++ b/drivers/gpu/drm/radeon/radeon_fence.c | |||
@@ -98,6 +98,25 @@ static u32 radeon_fence_read(struct radeon_device *rdev, int ring) | |||
98 | } | 98 | } |
99 | 99 | ||
100 | /** | 100 | /** |
101 | * radeon_fence_schedule_check - schedule lockup check | ||
102 | * | ||
103 | * @rdev: radeon_device pointer | ||
104 | * @ring: ring index we should work with | ||
105 | * | ||
106 | * Queues a delayed work item to check for lockups. | ||
107 | */ | ||
108 | static void radeon_fence_schedule_check(struct radeon_device *rdev, int ring) | ||
109 | { | ||
110 | /* | ||
111 | * Do not reset the timer here with mod_delayed_work, | ||
112 | * this can livelock in an interaction with TTM delayed destroy. | ||
113 | */ | ||
114 | queue_delayed_work(system_power_efficient_wq, | ||
115 | &rdev->fence_drv[ring].lockup_work, | ||
116 | RADEON_FENCE_JIFFIES_TIMEOUT); | ||
117 | } | ||
118 | |||
119 | /** | ||
101 | * radeon_fence_emit - emit a fence on the requested ring | 120 | * radeon_fence_emit - emit a fence on the requested ring |
102 | * | 121 | * |
103 | * @rdev: radeon_device pointer | 122 | * @rdev: radeon_device pointer |
@@ -122,19 +141,21 @@ int radeon_fence_emit(struct radeon_device *rdev, | |||
122 | (*fence)->ring = ring; | 141 | (*fence)->ring = ring; |
123 | radeon_fence_ring_emit(rdev, ring, *fence); | 142 | radeon_fence_ring_emit(rdev, ring, *fence); |
124 | trace_radeon_fence_emit(rdev->ddev, ring, (*fence)->seq); | 143 | trace_radeon_fence_emit(rdev->ddev, ring, (*fence)->seq); |
144 | radeon_fence_schedule_check(rdev, ring); | ||
125 | return 0; | 145 | return 0; |
126 | } | 146 | } |
127 | 147 | ||
128 | /** | 148 | /** |
129 | * radeon_fence_process - process a fence | 149 | * radeon_fence_activity - check for fence activity |
130 | * | 150 | * |
131 | * @rdev: radeon_device pointer | 151 | * @rdev: radeon_device pointer |
132 | * @ring: ring index the fence is associated with | 152 | * @ring: ring index the fence is associated with |
133 | * | 153 | * |
134 | * Checks the current fence value and wakes the fence queue | 154 | * Checks the current fence value and calculates the last |
135 | * if the sequence number has increased (all asics). | 155 | * signalled fence value. Returns true if activity occured |
156 | * on the ring, and the fence_queue should be waken up. | ||
136 | */ | 157 | */ |
137 | void radeon_fence_process(struct radeon_device *rdev, int ring) | 158 | static bool radeon_fence_activity(struct radeon_device *rdev, int ring) |
138 | { | 159 | { |
139 | uint64_t seq, last_seq, last_emitted; | 160 | uint64_t seq, last_seq, last_emitted; |
140 | unsigned count_loop = 0; | 161 | unsigned count_loop = 0; |
@@ -190,7 +211,67 @@ void radeon_fence_process(struct radeon_device *rdev, int ring) | |||
190 | } | 211 | } |
191 | } while (atomic64_xchg(&rdev->fence_drv[ring].last_seq, seq) > seq); | 212 | } while (atomic64_xchg(&rdev->fence_drv[ring].last_seq, seq) > seq); |
192 | 213 | ||
193 | if (wake) | 214 | if (seq < last_emitted) |
215 | radeon_fence_schedule_check(rdev, ring); | ||
216 | |||
217 | return wake; | ||
218 | } | ||
219 | |||
220 | /** | ||
221 | * radeon_fence_check_lockup - check for hardware lockup | ||
222 | * | ||
223 | * @work: delayed work item | ||
224 | * | ||
225 | * Checks for fence activity and if there is none probe | ||
226 | * the hardware if a lockup occured. | ||
227 | */ | ||
228 | static void radeon_fence_check_lockup(struct work_struct *work) | ||
229 | { | ||
230 | struct radeon_fence_driver *fence_drv; | ||
231 | struct radeon_device *rdev; | ||
232 | int ring; | ||
233 | |||
234 | fence_drv = container_of(work, struct radeon_fence_driver, | ||
235 | lockup_work.work); | ||
236 | rdev = fence_drv->rdev; | ||
237 | ring = fence_drv - &rdev->fence_drv[0]; | ||
238 | |||
239 | if (!down_read_trylock(&rdev->exclusive_lock)) { | ||
240 | /* just reschedule the check if a reset is going on */ | ||
241 | radeon_fence_schedule_check(rdev, ring); | ||
242 | return; | ||
243 | } | ||
244 | |||
245 | if (radeon_fence_activity(rdev, ring)) | ||
246 | wake_up_all(&rdev->fence_queue); | ||
247 | |||
248 | else if (radeon_ring_is_lockup(rdev, ring, &rdev->ring[ring])) { | ||
249 | |||
250 | /* good news we believe it's a lockup */ | ||
251 | dev_warn(rdev->dev, "GPU lockup (current fence id " | ||
252 | "0x%016llx last fence id 0x%016llx on ring %d)\n", | ||
253 | (uint64_t)atomic64_read(&fence_drv->last_seq), | ||
254 | fence_drv->sync_seq[ring], ring); | ||
255 | |||
256 | /* remember that we need an reset */ | ||
257 | rdev->needs_reset = true; | ||
258 | wake_up_all(&rdev->fence_queue); | ||
259 | } | ||
260 | up_read(&rdev->exclusive_lock); | ||
261 | } | ||
262 | |||
263 | /** | ||
264 | * radeon_fence_process - process a fence | ||
265 | * | ||
266 | * @rdev: radeon_device pointer | ||
267 | * @ring: ring index the fence is associated with | ||
268 | * | ||
269 | * Checks the current fence value and wakes the fence queue | ||
270 | * if the sequence number has increased (all asics). | ||
271 | */ | ||
272 | void radeon_fence_process(struct radeon_device *rdev, int ring) | ||
273 | { | ||
274 | if (radeon_fence_activity(rdev, ring)) | ||
194 | wake_up_all(&rdev->fence_queue); | 275 | wake_up_all(&rdev->fence_queue); |
195 | } | 276 | } |
196 | 277 | ||
@@ -300,86 +381,43 @@ static bool radeon_fence_any_seq_signaled(struct radeon_device *rdev, u64 *seq) | |||
300 | static int radeon_fence_wait_seq(struct radeon_device *rdev, u64 *target_seq, | 381 | static int radeon_fence_wait_seq(struct radeon_device *rdev, u64 *target_seq, |
301 | bool intr) | 382 | bool intr) |
302 | { | 383 | { |
303 | uint64_t last_seq[RADEON_NUM_RINGS]; | 384 | long r; |
304 | bool signaled; | 385 | int i; |
305 | int i, r; | ||
306 | |||
307 | while (!radeon_fence_any_seq_signaled(rdev, target_seq)) { | ||
308 | 386 | ||
309 | /* Save current sequence values, used to check for GPU lockups */ | 387 | if (radeon_fence_any_seq_signaled(rdev, target_seq)) |
310 | for (i = 0; i < RADEON_NUM_RINGS; ++i) { | 388 | return 0; |
311 | if (!target_seq[i]) | ||
312 | continue; | ||
313 | 389 | ||
314 | last_seq[i] = atomic64_read(&rdev->fence_drv[i].last_seq); | 390 | /* enable IRQs and tracing */ |
315 | trace_radeon_fence_wait_begin(rdev->ddev, i, target_seq[i]); | 391 | for (i = 0; i < RADEON_NUM_RINGS; ++i) { |
316 | radeon_irq_kms_sw_irq_get(rdev, i); | 392 | if (!target_seq[i]) |
317 | } | 393 | continue; |
318 | 394 | ||
319 | if (intr) { | 395 | trace_radeon_fence_wait_begin(rdev->ddev, i, target_seq[i]); |
320 | r = wait_event_interruptible_timeout(rdev->fence_queue, ( | 396 | radeon_irq_kms_sw_irq_get(rdev, i); |
321 | (signaled = radeon_fence_any_seq_signaled(rdev, target_seq)) | 397 | } |
322 | || rdev->needs_reset), RADEON_FENCE_JIFFIES_TIMEOUT); | ||
323 | } else { | ||
324 | r = wait_event_timeout(rdev->fence_queue, ( | ||
325 | (signaled = radeon_fence_any_seq_signaled(rdev, target_seq)) | ||
326 | || rdev->needs_reset), RADEON_FENCE_JIFFIES_TIMEOUT); | ||
327 | } | ||
328 | 398 | ||
329 | for (i = 0; i < RADEON_NUM_RINGS; ++i) { | 399 | if (intr) { |
330 | if (!target_seq[i]) | 400 | r = wait_event_interruptible_timeout(rdev->fence_queue, ( |
331 | continue; | 401 | radeon_fence_any_seq_signaled(rdev, target_seq) |
402 | || rdev->needs_reset), MAX_SCHEDULE_TIMEOUT); | ||
403 | } else { | ||
404 | r = wait_event_timeout(rdev->fence_queue, ( | ||
405 | radeon_fence_any_seq_signaled(rdev, target_seq) | ||
406 | || rdev->needs_reset), MAX_SCHEDULE_TIMEOUT); | ||
407 | } | ||
332 | 408 | ||
333 | radeon_irq_kms_sw_irq_put(rdev, i); | 409 | if (rdev->needs_reset) |
334 | trace_radeon_fence_wait_end(rdev->ddev, i, target_seq[i]); | 410 | r = -EDEADLK; |
335 | } | ||
336 | 411 | ||
337 | if (unlikely(r < 0)) | 412 | for (i = 0; i < RADEON_NUM_RINGS; ++i) { |
338 | return r; | 413 | if (!target_seq[i]) |
414 | continue; | ||
339 | 415 | ||
340 | if (unlikely(!signaled)) { | 416 | radeon_irq_kms_sw_irq_put(rdev, i); |
341 | if (rdev->needs_reset) | 417 | trace_radeon_fence_wait_end(rdev->ddev, i, target_seq[i]); |
342 | return -EDEADLK; | ||
343 | |||
344 | /* we were interrupted for some reason and fence | ||
345 | * isn't signaled yet, resume waiting */ | ||
346 | if (r) | ||
347 | continue; | ||
348 | |||
349 | for (i = 0; i < RADEON_NUM_RINGS; ++i) { | ||
350 | if (!target_seq[i]) | ||
351 | continue; | ||
352 | |||
353 | if (last_seq[i] != atomic64_read(&rdev->fence_drv[i].last_seq)) | ||
354 | break; | ||
355 | } | ||
356 | |||
357 | if (i != RADEON_NUM_RINGS) | ||
358 | continue; | ||
359 | |||
360 | for (i = 0; i < RADEON_NUM_RINGS; ++i) { | ||
361 | if (!target_seq[i]) | ||
362 | continue; | ||
363 | |||
364 | if (radeon_ring_is_lockup(rdev, i, &rdev->ring[i])) | ||
365 | break; | ||
366 | } | ||
367 | |||
368 | if (i < RADEON_NUM_RINGS) { | ||
369 | /* good news we believe it's a lockup */ | ||
370 | dev_warn(rdev->dev, "GPU lockup (waiting for " | ||
371 | "0x%016llx last fence id 0x%016llx on" | ||
372 | " ring %d)\n", | ||
373 | target_seq[i], last_seq[i], i); | ||
374 | |||
375 | /* remember that we need an reset */ | ||
376 | rdev->needs_reset = true; | ||
377 | wake_up_all(&rdev->fence_queue); | ||
378 | return -EDEADLK; | ||
379 | } | ||
380 | } | ||
381 | } | 418 | } |
382 | return 0; | 419 | |
420 | return r < 0 ? r : 0; | ||
383 | } | 421 | } |
384 | 422 | ||
385 | /** | 423 | /** |
@@ -711,6 +749,9 @@ static void radeon_fence_driver_init_ring(struct radeon_device *rdev, int ring) | |||
711 | rdev->fence_drv[ring].sync_seq[i] = 0; | 749 | rdev->fence_drv[ring].sync_seq[i] = 0; |
712 | atomic64_set(&rdev->fence_drv[ring].last_seq, 0); | 750 | atomic64_set(&rdev->fence_drv[ring].last_seq, 0); |
713 | rdev->fence_drv[ring].initialized = false; | 751 | rdev->fence_drv[ring].initialized = false; |
752 | INIT_DELAYED_WORK(&rdev->fence_drv[ring].lockup_work, | ||
753 | radeon_fence_check_lockup); | ||
754 | rdev->fence_drv[ring].rdev = rdev; | ||
714 | } | 755 | } |
715 | 756 | ||
716 | /** | 757 | /** |
@@ -760,6 +801,7 @@ void radeon_fence_driver_fini(struct radeon_device *rdev) | |||
760 | /* no need to trigger GPU reset as we are unloading */ | 801 | /* no need to trigger GPU reset as we are unloading */ |
761 | radeon_fence_driver_force_completion(rdev, ring); | 802 | radeon_fence_driver_force_completion(rdev, ring); |
762 | } | 803 | } |
804 | cancel_delayed_work_sync(&rdev->fence_drv[ring].lockup_work); | ||
763 | wake_up_all(&rdev->fence_queue); | 805 | wake_up_all(&rdev->fence_queue); |
764 | radeon_scratch_free(rdev, rdev->fence_drv[ring].scratch_reg); | 806 | radeon_scratch_free(rdev, rdev->fence_drv[ring].scratch_reg); |
765 | rdev->fence_drv[ring].initialized = false; | 807 | rdev->fence_drv[ring].initialized = false; |
@@ -778,8 +820,10 @@ void radeon_fence_driver_fini(struct radeon_device *rdev) | |||
778 | */ | 820 | */ |
779 | void radeon_fence_driver_force_completion(struct radeon_device *rdev, int ring) | 821 | void radeon_fence_driver_force_completion(struct radeon_device *rdev, int ring) |
780 | { | 822 | { |
781 | if (rdev->fence_drv[ring].initialized) | 823 | if (rdev->fence_drv[ring].initialized) { |
782 | radeon_fence_write(rdev, rdev->fence_drv[ring].sync_seq[ring], ring); | 824 | radeon_fence_write(rdev, rdev->fence_drv[ring].sync_seq[ring], ring); |
825 | cancel_delayed_work_sync(&rdev->fence_drv[ring].lockup_work); | ||
826 | } | ||
783 | } | 827 | } |
784 | 828 | ||
785 | 829 | ||