Re: [PATCH] drm/i915: Adjustable Render Power State policies

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



Hi Jesse,

 When updated your patches(drm/i915: "Scotty, I need more power!"), I found that latest kernel source changed much and can't patch successfully.

e.g.

  This is the kernel source drivers/gpu/drm/i915/intel_pm.c in (drm-intel-next-queued) git-3b27af3:

3331                 DRM_DEBUG_DRIVER("Failed to set the min frequency\n");

3332         }

3333

3334         gen6_set_rps(dev_priv->dev, (gt_perf_status & 0xff00) >> 8);

3335

3336         gen6_enable_rps_interrupts(dev);

3337

3338         rc6vids = 0;

3339         ret = sandybridge_pcode_read(dev_priv, GEN6_PCODE_READ_RC6VIDS, &rc6vids);

 

But in the patch:

--- a/drivers/gpu/drm/i915/intel_pm.c

+++ b/drivers/gpu/drm/i915/intel_pm.c

@@ -3323,19 +3323,25 @@ static void gen6_enable_rps(struct drm_device *dev)

                DRM_DEBUG_DRIVER("Failed to set the min frequency\n");

       }

 

-        gen6_set_rps(dev_priv->dev, (gt_perf_status & 0xff00) >> 8);

-

-        /* requires MSI enabled */

-        I915_WRITE(GEN6_PMIER, I915_READ(GEN6_PMIER) | GEN6_PM_RPS_EVENTS);

-        spin_lock_irq(&dev_priv->rps.lock);

-        /* FIXME: Our interrupt enabling sequence is bonghits.

-        * dev_priv->rps.pm_iir really should be 0 here. */

-        dev_priv->rps.pm_iir = 0;

 

Could you give us new patch that based on latest kernel?

 

 

Thanks,

Meng

 

 

-----Original Message-----
From: Jesse Barnes [mailto:jbarnes@xxxxxxxxxxxxxxxx]
Sent: Saturday, July 27, 2013 6:33 AM
To: Chris Wilson
Cc: intel-gfx@xxxxxxxxxxxxxxxxxxxxx; Zhang, Ouping; Meng, Mengmeng
Subject: Re: [PATCH] drm/i915: Adjustable Render Power State policies

 

Cool... I'd like to see if Ouping and Mengmeng can work together to get power & power numbers across a bunch of workloads for these policies.

 

Ouping & Mengmeng, can you run your usual battery of stuff against each of these settings and report back the results?

 

Thanks,

Jesse

 

On Fri, 26 Jul 2013 23:24:11 +0100

Chris Wilson <chris@xxxxxxxxxxxxxxxxxx> wrote:

 

> As a complement to the suggestions put forward by Jesse in

>

> drm/i915: "Scotty, I need more power!"

> (1372436290-3297-1-git-send-email-jbarnes@xxxxxxxxxxxxxxxx)

>

> and

>

> drm/i915: boost GPU and CPU freq when leaving idle

> (1372438472-3233-1-git-send-email-jbarnes@xxxxxxxxxxxxxxxx)

>

> we also have the ability to fine tune how we respond to the GPU's

> requests for more power.

>

> This patch introduces the i915.rps_policy module parameter that

> adjusts how we respond to the upclock request:

>

>   1 - Powersaving (current implementation)

>       Increase the frequency by one bin on every upclock request.

>

>   2 - Conservative (new default)

>       When waking from idle, boost the render frequency to the

>       default render frequency (RP1)

>

>   3 - Ondemand

>       At every upclock request, increase to halfway between the current

>       frequency and maximum. This should give rapid upclocking similar

>       to tcp window scaling.

>

>   4 - Performance

>       Every time the GPU wants more power, give it everything we have.

>

> Signed-off-by: Chris Wilson <chris@xxxxxxxxxxxxxxxxxx>

> ---

>  drivers/gpu/drm/i915/i915_drv.c |  8 +++++++ 

> drivers/gpu/drm/i915/i915_drv.h |  2 ++ 

> drivers/gpu/drm/i915/i915_irq.c | 46

> +++++++++++++++++++++++++++++------------

>  drivers/gpu/drm/i915/intel_pm.c |  1 +

>  4 files changed, 44 insertions(+), 13 deletions(-)

>

> diff --git a/drivers/gpu/drm/i915/i915_drv.c

> b/drivers/gpu/drm/i915/i915_drv.c index 1d8cedc..7ad80f4 100644

> --- a/drivers/gpu/drm/i915/i915_drv.c

> +++ b/drivers/gpu/drm/i915/i915_drv.c

> @@ -72,6 +72,14 @@ MODULE_PARM_DESC(i915_enable_rc6,

>              "For example, 3 would enable rc6 and deep rc6, and 7 would enable everything. "

>              "default: -1 (use per-chip default)");

> +int i915_rps_policy __read_mostly = 1; module_param_named(rps_policy,

> +i915_rps_policy, int, 0600); MODULE_PARM_DESC(rps_policy,

> +             "Specify a policy to use to respond to requests to change the render clock. "

> +             "Different levels of uplocking agressiveness can be selected"

> +             "(0 = Powersaving, slowly uplock; 1 = Conservative, when the gpu wakes from idle go straight to RP1/RPe (recommended minimum active GPU frequency); 2 = Ondemand, rapidly increase frequency whilst upclocking; 4 = Performance, always upclock to maximum frequency). "

> +             "default: 1 (Conservative)");

> +

>  int i915_enable_fbc __read_mostly = -1; 

> module_param_named(i915_enable_fbc, i915_enable_fbc, int, 0600); 

> MODULE_PARM_DESC(i915_enable_fbc, diff --git

> a/drivers/gpu/drm/i915/i915_drv.h b/drivers/gpu/drm/i915/i915_drv.h

> index ec14124..71232bc 100644

> --- a/drivers/gpu/drm/i915/i915_drv.h

> +++ b/drivers/gpu/drm/i915/i915_drv.h

> @@ -811,6 +811,7 @@ struct intel_gen6_power_mgmt {

>    u8 min_delay;

>    u8 max_delay;

>    u8 rpe_delay;

> +    u8 rp1_delay;

>    u8 hw_max;

>    struct delayed_work delayed_resume_work; @@ -1635,6 +1636,7 @@

> extern int i915_lvds_channel_mode __read_mostly;  extern int

> i915_panel_use_ssc __read_mostly;  extern int i915_vbt_sdvo_panel_type

> __read_mostly;  extern int i915_enable_rc6 __read_mostly;

> +extern int i915_rps_policy __read_mostly;

>  extern int i915_enable_fbc __read_mostly;  extern bool

> i915_enable_hangcheck __read_mostly;  extern int i915_enable_ppgtt

> __read_mostly; diff --git a/drivers/gpu/drm/i915/i915_irq.c

> b/drivers/gpu/drm/i915/i915_irq.c index ee3e49c..edd73c0 100644

> --- a/drivers/gpu/drm/i915/i915_irq.c

> +++ b/drivers/gpu/drm/i915/i915_irq.c

> @@ -728,14 +728,32 @@ static void gen6_pm_rps_work(struct work_struct *work)

>    mutex_lock(&dev_priv->rps.hw_lock);

>    if (pm_iir & GEN6_PM_RP_UP_THRESHOLD) {

> -              new_delay = dev_priv->rps.cur_delay + 1;

> +             switch (i915_rps_policy) {

> +             case 0: /* Powersave, slow increase in frequency */

> +                      new_delay = dev_priv->rps.cur_delay + 1;

> +                      break;

> +

> +             case 1: /* Conservative, jump directly to RPe */

> +                      new_delay = dev_priv->rps.rp1_delay;

> +                      if (dev_priv->rps.cur_delay >= new_delay)

> +                                new_delay = dev_priv->rps.cur_delay + 1;

> +                      break;

> +

> +             case 2: /* Ondemand, halfway to maximum */

> +                      new_delay = dev_priv->rps.cur_delay + 1;

> +                      if (new_delay < dev_priv->rps.rp1_delay)

> +                                new_delay = dev_priv->rps.rp1_delay;

> +                      else

> +                                new_delay = (dev_priv->rps.max_delay + new_delay) >> 1;

> +                      break;

> +

> +             default: /* Performance, straight to maximum */

> +                      new_delay = dev_priv->rps.max_delay;

> +                      break;

> +             }

> -              /*

> -              * For better performance, jump directly

> -              * to RPe if we're below it.

> -              */

>              if (IS_VALLEYVIEW(dev_priv->dev) &&

> -                  dev_priv->rps.cur_delay < dev_priv->rps.rpe_delay)

> +                 new_delay < dev_priv->rps.rpe_delay)

>                       new_delay = dev_priv->rps.rpe_delay;

>    } else

>              new_delay = dev_priv->rps.cur_delay - 1; @@ -743,13 +761,15 @@

> static void gen6_pm_rps_work(struct work_struct *work)

>    /* sysfs frequency interfaces may have snuck in while servicing the

>     * interrupt

>     */

> -     if (new_delay >= dev_priv->rps.min_delay &&

> -         new_delay <= dev_priv->rps.max_delay) {

> -              if (IS_VALLEYVIEW(dev_priv->dev))

> -                       valleyview_set_rps(dev_priv->dev, new_delay);

> -              else

> -                       gen6_set_rps(dev_priv->dev, new_delay);

> -     }

> +    if (new_delay < dev_priv->rps.min_delay)

> +             new_delay = dev_priv->rps.min_delay;

> +    if (new_delay > dev_priv->rps.max_delay)

> +             new_delay = dev_priv->rps.max_delay;

> +

> +    if (IS_VALLEYVIEW(dev_priv->dev))

> +             valleyview_set_rps(dev_priv->dev, new_delay);

> +    else

> +             gen6_set_rps(dev_priv->dev, new_delay);

>    if (IS_VALLEYVIEW(dev_priv->dev)) {

>              /*

> diff --git a/drivers/gpu/drm/i915/intel_pm.c

> b/drivers/gpu/drm/i915/intel_pm.c index 4e6d618..e9e467c 100644

> --- a/drivers/gpu/drm/i915/intel_pm.c

> +++ b/drivers/gpu/drm/i915/intel_pm.c

> @@ -3242,6 +3242,7 @@ static void gen6_enable_rps(struct drm_device *dev)

>    /* In units of 50MHz */

>    dev_priv->rps.hw_max = dev_priv->rps.max_delay = rp_state_cap & 0xff;

>    dev_priv->rps.min_delay = (rp_state_cap & 0xff0000) >> 16;

> +    dev_priv->rps.rp1_delay = (rp_state_cap & 0xff00) >> 8;

>    dev_priv->rps.cur_delay = 0;

>    /* disable the counters and set deterministic thresholds */

 

 

--

Jesse Barnes, Intel Open Source Technology Center

_______________________________________________
Intel-gfx mailing list
Intel-gfx@xxxxxxxxxxxxxxxxxxxxx
http://lists.freedesktop.org/mailman/listinfo/intel-gfx

[Index of Archives]     [Linux USB Devel]     [Linux Audio Users]     [Yosemite News]     [Linux Kernel]     [Linux SCSI]
  Powered by Linux