aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorVille Syrjälä <ville.syrjala@linux.intel.com>2013-06-25 12:21:02 -0400
committerDaniel Vetter <daniel.vetter@ffwll.ch>2013-07-01 05:14:48 -0400
commit80814ae4dae5d2070b1ca848df728feb6a10e6f2 (patch)
tree615107a6b7a14ca91c4cab3e19b6a8084f6dfe60
parent73008b989faf4200907a858f9b902ee29d6edbea (diff)
drm/i915: Don't wait for Punit after each freq change on VLV
It seems that even though Punit reports the frequency change to have been completed, it still reports the old frequency in the status register for some time. So rather than polling for Punit to complete the frequency change after each request, poll before. This gets rid of the spurious "Punit overrode GPU freq" messages. This also lets us continue working while Punit is performing the actual frequency change. As a result, openarena demo088-test1 timedemo average fps is increased by ~5 fps, and the slowest frame duration is reduced by ~25%. The sysfs cur_freq file always reads the current frequency from Punit anyway, so having rps.cur_delay be slightly off at times doesn't matter. Signed-off-by: Ville Syrjälä <ville.syrjala@linux.intel.com> Reviewed-by: Jesse Barnes <jbarnes@virtuousgeek.org> Signed-off-by: Daniel Vetter <daniel.vetter@ffwll.ch>
-rw-r--r--drivers/gpu/drm/i915/intel_pm.c53
1 files changed, 35 insertions, 18 deletions
diff --git a/drivers/gpu/drm/i915/intel_pm.c b/drivers/gpu/drm/i915/intel_pm.c
index 33aa2d6674e5..909dbe1e39fc 100644
--- a/drivers/gpu/drm/i915/intel_pm.c
+++ b/drivers/gpu/drm/i915/intel_pm.c
@@ -3069,17 +3069,49 @@ void gen6_set_rps(struct drm_device *dev, u8 val)
3069 trace_intel_gpu_freq_change(val * 50); 3069 trace_intel_gpu_freq_change(val * 50);
3070} 3070}
3071 3071
3072/*
3073 * Wait until the previous freq change has completed,
3074 * or the timeout elapsed, and then update our notion
3075 * of the current GPU frequency.
3076 */
3077static void vlv_update_rps_cur_delay(struct drm_i915_private *dev_priv)
3078{
3079 unsigned long timeout = jiffies + msecs_to_jiffies(10);
3080 u32 pval;
3081
3082 WARN_ON(!mutex_is_locked(&dev_priv->rps.hw_lock));
3083
3084 do {
3085 pval = vlv_punit_read(dev_priv, PUNIT_REG_GPU_FREQ_STS);
3086 if (time_after(jiffies, timeout)) {
3087 DRM_DEBUG_DRIVER("timed out waiting for Punit\n");
3088 break;
3089 }
3090 udelay(10);
3091 } while (pval & 1);
3092
3093 pval >>= 8;
3094
3095 if (pval != dev_priv->rps.cur_delay)
3096 DRM_DEBUG_DRIVER("Punit overrode GPU freq: %d MHz (%u) requested, but got %d Mhz (%u)\n",
3097 vlv_gpu_freq(dev_priv->mem_freq, dev_priv->rps.cur_delay),
3098 dev_priv->rps.cur_delay,
3099 vlv_gpu_freq(dev_priv->mem_freq, pval), pval);
3100
3101 dev_priv->rps.cur_delay = pval;
3102}
3103
3072void valleyview_set_rps(struct drm_device *dev, u8 val) 3104void valleyview_set_rps(struct drm_device *dev, u8 val)
3073{ 3105{
3074 struct drm_i915_private *dev_priv = dev->dev_private; 3106 struct drm_i915_private *dev_priv = dev->dev_private;
3075 unsigned long timeout = jiffies + msecs_to_jiffies(10);
3076 u32 limits = gen6_rps_limits(dev_priv, &val); 3107 u32 limits = gen6_rps_limits(dev_priv, &val);
3077 u32 pval;
3078 3108
3079 WARN_ON(!mutex_is_locked(&dev_priv->rps.hw_lock)); 3109 WARN_ON(!mutex_is_locked(&dev_priv->rps.hw_lock));
3080 WARN_ON(val > dev_priv->rps.max_delay); 3110 WARN_ON(val > dev_priv->rps.max_delay);
3081 WARN_ON(val < dev_priv->rps.min_delay); 3111 WARN_ON(val < dev_priv->rps.min_delay);
3082 3112
3113 vlv_update_rps_cur_delay(dev_priv);
3114
3083 DRM_DEBUG_DRIVER("GPU freq request from %d MHz (%u) to %d MHz (%u)\n", 3115 DRM_DEBUG_DRIVER("GPU freq request from %d MHz (%u) to %d MHz (%u)\n",
3084 vlv_gpu_freq(dev_priv->mem_freq, 3116 vlv_gpu_freq(dev_priv->mem_freq,
3085 dev_priv->rps.cur_delay), 3117 dev_priv->rps.cur_delay),
@@ -3091,27 +3123,12 @@ void valleyview_set_rps(struct drm_device *dev, u8 val)
3091 3123
3092 vlv_punit_write(dev_priv, PUNIT_REG_GPU_FREQ_REQ, val); 3124 vlv_punit_write(dev_priv, PUNIT_REG_GPU_FREQ_REQ, val);
3093 3125
3094 do {
3095 pval = vlv_punit_read(dev_priv, PUNIT_REG_GPU_FREQ_STS);
3096 if (time_after(jiffies, timeout)) {
3097 DRM_DEBUG_DRIVER("timed out waiting for Punit\n");
3098 break;
3099 }
3100 udelay(10);
3101 } while (pval & 1);
3102
3103 pval = vlv_punit_read(dev_priv, PUNIT_REG_GPU_FREQ_STS);
3104 if ((pval >> 8) != val)
3105 DRM_DEBUG_DRIVER("Punit overrode GPU freq: %d MHz (%u) requested, but got %d Mhz (%u)\n",
3106 vlv_gpu_freq(dev_priv->mem_freq, val), val,
3107 vlv_gpu_freq(dev_priv->mem_freq, pval >> 8), pval >> 8);
3108
3109 /* Make sure we continue to get interrupts 3126 /* Make sure we continue to get interrupts
3110 * until we hit the minimum or maximum frequencies. 3127 * until we hit the minimum or maximum frequencies.
3111 */ 3128 */
3112 I915_WRITE(GEN6_RP_INTERRUPT_LIMITS, limits); 3129 I915_WRITE(GEN6_RP_INTERRUPT_LIMITS, limits);
3113 3130
3114 dev_priv->rps.cur_delay = pval >> 8; 3131 dev_priv->rps.cur_delay = val;
3115 3132
3116 trace_intel_gpu_freq_change(vlv_gpu_freq(dev_priv->mem_freq, val)); 3133 trace_intel_gpu_freq_change(vlv_gpu_freq(dev_priv->mem_freq, val));
3117} 3134}