diff mbox

[01/25] drm/i915/fbc: wait for a vblank instead of 50ms when enabling

Message ID 1453210558-7875-2-git-send-email-paulo.r.zanoni@intel.com (mailing list archive)
State New, archived
Headers show

Commit Message

Zanoni, Paulo R Jan. 19, 2016, 1:35 p.m. UTC
Instead of waiting for 50ms, just wait until the next vblank, since
it's the minimum requirement. The whole infrastructure of FBC is based
on vblanks, so waiting for X vblanks instead of X milliseconds sounds
like the correct way to go. Besides, 50ms may be less than a vblank on
super slow modes that may or may not exist.

There are some small improvements in PC state residency (due to the
fact that we're now using 16ms for the common modes instead of 50ms),
but the biggest advantage is still the correctness of being
vblank-based instead of time-based.

v2:
  - Rebase after changing the patch order.
  - Update the commit message.
v3:
  - Fix bogus vblank_get() instead of vblank_count() (Ville).
  - Don't forget to call drm_crtc_vblank_{get,put} (Chris, Ville)
  - Adjust the performance details on the commit message.

Signed-off-by: Paulo Zanoni <paulo.r.zanoni@intel.com>
---
 drivers/gpu/drm/i915/i915_drv.h  |  2 +-
 drivers/gpu/drm/i915/intel_fbc.c | 43 ++++++++++++++++++++++++++++------------
 2 files changed, 31 insertions(+), 14 deletions(-)

Comments

Maarten Lankhorst Jan. 21, 2016, 2:17 p.m. UTC | #1
Op 19-01-16 om 14:35 schreef Paulo Zanoni:
> Instead of waiting for 50ms, just wait until the next vblank, since
> it's the minimum requirement. The whole infrastructure of FBC is based
> on vblanks, so waiting for X vblanks instead of X milliseconds sounds
> like the correct way to go. Besides, 50ms may be less than a vblank on
> super slow modes that may or may not exist.
>
> There are some small improvements in PC state residency (due to the
> fact that we're now using 16ms for the common modes instead of 50ms),
> but the biggest advantage is still the correctness of being
> vblank-based instead of time-based.
>
> v2:
>   - Rebase after changing the patch order.
>   - Update the commit message.
> v3:
>   - Fix bogus vblank_get() instead of vblank_count() (Ville).
>   - Don't forget to call drm_crtc_vblank_{get,put} (Chris, Ville)
>   - Adjust the performance details on the commit message.
>
> Signed-off-by: Paulo Zanoni <paulo.r.zanoni@intel.com>
> ---
>  drivers/gpu/drm/i915/i915_drv.h  |  2 +-
>  drivers/gpu/drm/i915/intel_fbc.c | 43 ++++++++++++++++++++++++++++------------
>  2 files changed, 31 insertions(+), 14 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/i915_drv.h b/drivers/gpu/drm/i915/i915_drv.h
> index af30148..33217a4 100644
> --- a/drivers/gpu/drm/i915/i915_drv.h
> +++ b/drivers/gpu/drm/i915/i915_drv.h
> @@ -925,9 +925,9 @@ struct i915_fbc {
>  
>  	struct intel_fbc_work {
>  		bool scheduled;
> +		u32 scheduled_vblank;
>  		struct work_struct work;
>  		struct drm_framebuffer *fb;
> -		unsigned long enable_jiffies;
>  	} work;
>  
>  	const char *no_fbc_reason;
> diff --git a/drivers/gpu/drm/i915/intel_fbc.c b/drivers/gpu/drm/i915/intel_fbc.c
> index a1988a4..6b43ec3 100644
> --- a/drivers/gpu/drm/i915/intel_fbc.c
> +++ b/drivers/gpu/drm/i915/intel_fbc.c
> @@ -381,7 +381,15 @@ static void intel_fbc_work_fn(struct work_struct *__work)
>  		container_of(__work, struct drm_i915_private, fbc.work.work);
>  	struct intel_fbc_work *work = &dev_priv->fbc.work;
>  	struct intel_crtc *crtc = dev_priv->fbc.crtc;
> -	int delay_ms = 50;
> +	struct drm_vblank_crtc *vblank = &dev_priv->dev->vblank[crtc->pipe];
> +
> +	mutex_lock(&dev_priv->fbc.lock);
> +	if (drm_crtc_vblank_get(&crtc->base)) {
> +		DRM_ERROR("vblank not available for FBC on pipe %c\n",
> +			  pipe_name(crtc->pipe));
> +		goto out;
> +	}
> +	mutex_unlock(&dev_priv->fbc.lock);
What does the lock protect here?

~Maarten
Zanoni, Paulo R Jan. 21, 2016, 4:56 p.m. UTC | #2
Em Qui, 2016-01-21 às 15:17 +0100, Maarten Lankhorst escreveu:
> Op 19-01-16 om 14:35 schreef Paulo Zanoni:

> > Instead of waiting for 50ms, just wait until the next vblank, since

> > it's the minimum requirement. The whole infrastructure of FBC is

> > based

> > on vblanks, so waiting for X vblanks instead of X milliseconds

> > sounds

> > like the correct way to go. Besides, 50ms may be less than a vblank

> > on

> > super slow modes that may or may not exist.

> > 

> > There are some small improvements in PC state residency (due to the

> > fact that we're now using 16ms for the common modes instead of

> > 50ms),

> > but the biggest advantage is still the correctness of being

> > vblank-based instead of time-based.

> > 

> > v2:

> >   - Rebase after changing the patch order.

> >   - Update the commit message.

> > v3:

> >   - Fix bogus vblank_get() instead of vblank_count() (Ville).

> >   - Don't forget to call drm_crtc_vblank_{get,put} (Chris, Ville)

> >   - Adjust the performance details on the commit message.

> > 

> > Signed-off-by: Paulo Zanoni <paulo.r.zanoni@intel.com>

> > ---

> >  drivers/gpu/drm/i915/i915_drv.h  |  2 +-

> >  drivers/gpu/drm/i915/intel_fbc.c | 43

> > ++++++++++++++++++++++++++++------------

> >  2 files changed, 31 insertions(+), 14 deletions(-)

> > 

> > diff --git a/drivers/gpu/drm/i915/i915_drv.h

> > b/drivers/gpu/drm/i915/i915_drv.h

> > index af30148..33217a4 100644

> > --- a/drivers/gpu/drm/i915/i915_drv.h

> > +++ b/drivers/gpu/drm/i915/i915_drv.h

> > @@ -925,9 +925,9 @@ struct i915_fbc {

> >  

> >  	struct intel_fbc_work {

> >  		bool scheduled;

> > +		u32 scheduled_vblank;

> >  		struct work_struct work;

> >  		struct drm_framebuffer *fb;

> > -		unsigned long enable_jiffies;

> >  	} work;

> >  

> >  	const char *no_fbc_reason;

> > diff --git a/drivers/gpu/drm/i915/intel_fbc.c

> > b/drivers/gpu/drm/i915/intel_fbc.c

> > index a1988a4..6b43ec3 100644

> > --- a/drivers/gpu/drm/i915/intel_fbc.c

> > +++ b/drivers/gpu/drm/i915/intel_fbc.c

> > @@ -381,7 +381,15 @@ static void intel_fbc_work_fn(struct

> > work_struct *__work)

> >  		container_of(__work, struct drm_i915_private,

> > fbc.work.work);

> >  	struct intel_fbc_work *work = &dev_priv->fbc.work;

> >  	struct intel_crtc *crtc = dev_priv->fbc.crtc;

> > -	int delay_ms = 50;

> > +	struct drm_vblank_crtc *vblank = &dev_priv->dev-

> > >vblank[crtc->pipe];

> > +

> > +	mutex_lock(&dev_priv->fbc.lock);

> > +	if (drm_crtc_vblank_get(&crtc->base)) {

> > +		DRM_ERROR("vblank not available for FBC on pipe

> > %c\n",

> > +			  pipe_name(crtc->pipe));

> > +		goto out;

> > +	}

> > +	mutex_unlock(&dev_priv->fbc.lock);

> What does the lock protect here?


Hmmm, yeah, it protects nothing... Well observed.

> 

> ~Maarten

> _______________________________________________

> Intel-gfx mailing list

> Intel-gfx@lists.freedesktop.org

> http://lists.freedesktop.org/mailman/listinfo/intel-gfx
diff mbox

Patch

diff --git a/drivers/gpu/drm/i915/i915_drv.h b/drivers/gpu/drm/i915/i915_drv.h
index af30148..33217a4 100644
--- a/drivers/gpu/drm/i915/i915_drv.h
+++ b/drivers/gpu/drm/i915/i915_drv.h
@@ -925,9 +925,9 @@  struct i915_fbc {
 
 	struct intel_fbc_work {
 		bool scheduled;
+		u32 scheduled_vblank;
 		struct work_struct work;
 		struct drm_framebuffer *fb;
-		unsigned long enable_jiffies;
 	} work;
 
 	const char *no_fbc_reason;
diff --git a/drivers/gpu/drm/i915/intel_fbc.c b/drivers/gpu/drm/i915/intel_fbc.c
index a1988a4..6b43ec3 100644
--- a/drivers/gpu/drm/i915/intel_fbc.c
+++ b/drivers/gpu/drm/i915/intel_fbc.c
@@ -381,7 +381,15 @@  static void intel_fbc_work_fn(struct work_struct *__work)
 		container_of(__work, struct drm_i915_private, fbc.work.work);
 	struct intel_fbc_work *work = &dev_priv->fbc.work;
 	struct intel_crtc *crtc = dev_priv->fbc.crtc;
-	int delay_ms = 50;
+	struct drm_vblank_crtc *vblank = &dev_priv->dev->vblank[crtc->pipe];
+
+	mutex_lock(&dev_priv->fbc.lock);
+	if (drm_crtc_vblank_get(&crtc->base)) {
+		DRM_ERROR("vblank not available for FBC on pipe %c\n",
+			  pipe_name(crtc->pipe));
+		goto out;
+	}
+	mutex_unlock(&dev_priv->fbc.lock);
 
 retry:
 	/* Delay the actual enabling to let pageflipping cease and the
@@ -390,24 +398,25 @@  retry:
 	 * vblank to pass after disabling the FBC before we attempt
 	 * to modify the control registers.
 	 *
-	 * A more complicated solution would involve tracking vblanks
-	 * following the termination of the page-flipping sequence
-	 * and indeed performing the enable as a co-routine and not
-	 * waiting synchronously upon the vblank.
-	 *
 	 * WaFbcWaitForVBlankBeforeEnable:ilk,snb
+	 *
+	 * It is also worth mentioning that since work->scheduled_vblank can be
+	 * updated multiple times by the other threads, hitting the timeout is
+	 * not an error condition. We'll just end up hitting the "goto retry"
+	 * case below.
 	 */
-	wait_remaining_ms_from_jiffies(work->enable_jiffies, delay_ms);
+	wait_event_timeout(vblank->queue,
+		drm_crtc_vblank_count(&crtc->base) != work->scheduled_vblank,
+		msecs_to_jiffies(50));
 
 	mutex_lock(&dev_priv->fbc.lock);
 
 	/* Were we cancelled? */
 	if (!work->scheduled)
-		goto out;
+		goto out_put;
 
 	/* Were we delayed again while this function was sleeping? */
-	if (time_after(work->enable_jiffies + msecs_to_jiffies(delay_ms),
-		       jiffies)) {
+	if (drm_crtc_vblank_count(&crtc->base) == work->scheduled_vblank) {
 		mutex_unlock(&dev_priv->fbc.lock);
 		goto retry;
 	}
@@ -415,9 +424,10 @@  retry:
 	if (crtc->base.primary->fb == work->fb)
 		intel_fbc_activate(work->fb);
 
-	work->scheduled = false;
-
+out_put:
+	drm_crtc_vblank_put(&crtc->base);
 out:
+	work->scheduled = false;
 	mutex_unlock(&dev_priv->fbc.lock);
 }
 
@@ -434,13 +444,20 @@  static void intel_fbc_schedule_activation(struct intel_crtc *crtc)
 
 	WARN_ON(!mutex_is_locked(&dev_priv->fbc.lock));
 
+	if (drm_crtc_vblank_get(&crtc->base)) {
+		DRM_ERROR("vblank not available for FBC on pipe %c\n",
+			  pipe_name(crtc->pipe));
+		return;
+	}
+
 	/* It is useless to call intel_fbc_cancel_work() in this function since
 	 * we're not releasing fbc.lock, so it won't have an opportunity to grab
 	 * it to discover that it was cancelled. So we just update the expected
 	 * jiffy count. */
 	work->fb = crtc->base.primary->fb;
 	work->scheduled = true;
-	work->enable_jiffies = jiffies;
+	work->scheduled_vblank = drm_crtc_vblank_count(&crtc->base);
+	drm_crtc_vblank_put(&crtc->base);
 
 	schedule_work(&work->work);
 }