aboutsummaryrefslogtreecommitdiffstats
path: root/drivers/gpu/drm/radeon/r600.c
diff options
context:
space:
mode:
authorMatthew Dawson <matthew@mjdsystems.ca>2016-02-07 16:51:12 -0500
committerAlex Deucher <alexander.deucher@amd.com>2016-02-10 14:17:15 -0500
commit04db4caf5c836c211977a54c9218f2cdee14897f (patch)
tree99460f045362a3d7bae6b9d1c64843f85cd19107 /drivers/gpu/drm/radeon/r600.c
parent6e9821b26dd45b4a3e30c4219be2abd802563379 (diff)
drm/radeon: Avoid double gpu reset by adding a timeout on IB ring tests.
When the radeon driver resets a gpu, it attempts to test whether all the rings can successfully handle an IB. If these rings fail to respond, the process will wait forever. Another gpu reset can't happen at this point, as the current reset holds a lock required to do so. Instead, make all the IB tests run with a timeout, so the system can attempt to recover in this case. While this doesn't fix the underlying issue with card resets failing, it gives the system a higher chance of recovering. These timeouts have been confirmed to help both a Tathi and Hawaii card recover after a gpu reset. This also adds a new function, radeon_fence_wait_timeout, that behaves like fence_wait_timeout. It is used instead of fence_wait_timeout as it continues to work during a reset. radeon_fence_wait is changed to be implemented using this function. V2: - Changed the timeout to 1s, as the default 10s from radeon_wait_timeout was too long. A timeout of 100ms was tested and found to be too short. - Changed radeon_fence_wait_timeout to behave more like fence_wait_timeout. Reviewed-by: Christian König <christian.koenig@amd.com> Signed-off-by: Matthew Dawson <matthew@mjdsystems.ca> Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
Diffstat (limited to 'drivers/gpu/drm/radeon/r600.c')
-rw-r--r--drivers/gpu/drm/radeon/r600.c10
1 files changed, 8 insertions, 2 deletions
diff --git a/drivers/gpu/drm/radeon/r600.c b/drivers/gpu/drm/radeon/r600.c
index cc2fdf0be37a..ed121042247f 100644
--- a/drivers/gpu/drm/radeon/r600.c
+++ b/drivers/gpu/drm/radeon/r600.c
@@ -3381,11 +3381,17 @@ int r600_ib_test(struct radeon_device *rdev, struct radeon_ring *ring)
3381 DRM_ERROR("radeon: failed to schedule ib (%d).\n", r); 3381 DRM_ERROR("radeon: failed to schedule ib (%d).\n", r);
3382 goto free_ib; 3382 goto free_ib;
3383 } 3383 }
3384 r = radeon_fence_wait(ib.fence, false); 3384 r = radeon_fence_wait_timeout(ib.fence, false, usecs_to_jiffies(
3385 if (r) { 3385 RADEON_USEC_IB_TEST_TIMEOUT));
3386 if (r < 0) {
3386 DRM_ERROR("radeon: fence wait failed (%d).\n", r); 3387 DRM_ERROR("radeon: fence wait failed (%d).\n", r);
3387 goto free_ib; 3388 goto free_ib;
3389 } else if (r == 0) {
3390 DRM_ERROR("radeon: fence wait timed out.\n");
3391 r = -ETIMEDOUT;
3392 goto free_ib;
3388 } 3393 }
3394 r = 0;
3389 for (i = 0; i < rdev->usec_timeout; i++) { 3395 for (i = 0; i < rdev->usec_timeout; i++) {
3390 tmp = RREG32(scratch); 3396 tmp = RREG32(scratch);
3391 if (tmp == 0xDEADBEEF) 3397 if (tmp == 0xDEADBEEF)