Re: [PATCH v6 6/6] drm/i915/skl: Update DDB values atomically with wms/plane attrs

From: Lyude Paul
Date: Wed Aug 03 2016 - 17:39:33 EST


On Wed, 2016-08-03 at 18:00 +0300, Ville Syrjälä wrote:
> On Tue, Aug 02, 2016 at 06:37:37PM -0400, Lyude wrote:
> >
> > Now that we can hook into update_crtcs and control the order in which we
> > update CRTCs at each modeset, we can finish the final step of fixing
> > Skylake's watermark handling by performing DDB updates at the same time
> > as plane updates and watermark updates.
> >
> > The first major change in this patch is skl_update_crtcs(), which
> > handles ensuring that we order each CRTC update in our atomic commits
> > properly so that they honor the DDB flush order.
> >
> > The second major change in this patch is the order in which we flush the
> > pipes. While the previous order may have worked, it can't be used in
> > this approach since it no longer will do the right thing. For example,
> > using the old ddb flush order:
> >
> > We have pipes A, B, and C enabled, and we're disabling C. Initial ddb
> > allocation looks like this:
> >
> >
> > |   A   |   B   |xxxxxxx|
> >
> > Since we're performing the ddb updates after performing any CRTC
> > disablements in intel_atomic_commit_tail(), the space to the right of
> > pipe B is unallocated.
> >
> > 1. Flush pipes with new allocation contained into old space. None
> >    apply, so we skip this
> > 2. Flush pipes having their allocation reduced, but overlapping with a
> >    previous allocation. None apply, so we also skip this
> > 3. Flush pipes that got more space allocated. This applies to A and B,
> >    giving us the following update order: A, B
> >
> > This is wrong, since updating pipe A first will cause it to overlap with
> > B and potentially burst into flames. Our new order (see the code
> > comments for details) would update the pipes in the proper order: B, A.
> >
> > As well, we calculate the order for each DDB update during the check
> > phase, and reference it later in the commit phase when we hit
> > skl_update_crtcs().
> >
> > This long overdue patch fixes the rest of the underruns on Skylake.
> >
> > Changes since v1:
> >  - Add skl_ddb_entry_write() for cursor into skl_write_cursor_wm()
> >
> > Fixes: 0e8fb7ba7ca5 ("drm/i915/skl: Flush the WM configuration")
> > Fixes: 8211bd5bdf5e ("drm/i915/skl: Program the DDB allocation")
> > Signed-off-by: Lyude <cpaul@xxxxxxxxxx>
> > [omitting CC for stable, since this patch will need to be changed for
> > such backports first]
> > Cc: Ville Syrjälä <ville.syrjala@xxxxxxxxxxxxxxx>
> > Cc: Daniel Vetter <daniel.vetter@xxxxxxxxx>
> > Cc: Radhakrishna Sripada <radhakrishna.sripada@xxxxxxxxx>
> > Cc: Hans de Goede <hdegoede@xxxxxxxxxx>
> > Cc: Matt Roper <matthew.d.roper@xxxxxxxxx>
> > ---
> >  drivers/gpu/drm/i915/intel_display.c | 100 ++++++++++--
> >  drivers/gpu/drm/i915/intel_drv.h     |  10 ++
> >  drivers/gpu/drm/i915/intel_pm.c      | 288 ++++++++++++++++--------------
> > -----
> >  3 files changed, 233 insertions(+), 165 deletions(-)
> >
> > diff --git a/drivers/gpu/drm/i915/intel_display.c
> > b/drivers/gpu/drm/i915/intel_display.c
> > index 59cf513..06295f7 100644
> > --- a/drivers/gpu/drm/i915/intel_display.c
> > +++ b/drivers/gpu/drm/i915/intel_display.c
> > @@ -12897,16 +12897,23 @@ static void verify_wm_state(struct drm_crtc *crtc,
> > Â ÂÂhw_entry->start, hw_entry->end);
> > Â }
> > Â
> > - /* cursor */
> > - hw_entry = &hw_ddb.plane[pipe][PLANE_CURSOR];
> > - sw_entry = &sw_ddb->plane[pipe][PLANE_CURSOR];
> > -
> > - if (!skl_ddb_entry_equal(hw_entry, sw_entry)) {
> > - DRM_ERROR("mismatch in DDB state pipe %c cursor "
> > - ÂÂ"(expected (%u,%u), found (%u,%u))\n",
> > - ÂÂpipe_name(pipe),
> > - ÂÂsw_entry->start, sw_entry->end,
> > - ÂÂhw_entry->start, hw_entry->end);
> > + /*
> > + Â* cursor
> > + Â* If the cursor plane isn't active, we may not have updated it's
> > ddb
> > + Â* allocation. In that case since the ddb allocation will be
> > updated
> > + Â* once the plane becomes visible, we can skip this check
> > + Â*/
> > + if (intel_crtc->cursor_addr) {
> > + hw_entry = &hw_ddb.plane[pipe][PLANE_CURSOR];
> > + sw_entry = &sw_ddb->plane[pipe][PLANE_CURSOR];
> > +
> > + if (!skl_ddb_entry_equal(hw_entry, sw_entry)) {
> > + DRM_ERROR("mismatch in DDB state pipe %c cursor "
> > + ÂÂ"(expected (%u,%u), found (%u,%u))\n",
> > + ÂÂpipe_name(pipe),
> > + ÂÂsw_entry->start, sw_entry->end,
> > + ÂÂhw_entry->start, hw_entry->end);
> > + }
> > Â }
> > Â}
> > Â
> > @@ -13658,6 +13665,72 @@ static void intel_update_crtcs(struct
> > drm_atomic_state *state,
> > Â }
> > Â}
> > Â
> > +static inline void
> > +skl_do_ddb_step(struct drm_atomic_state *state,
> > + enum skl_ddb_step step)
> > +{
> > + struct intel_atomic_state *intel_state =
> > to_intel_atomic_state(state);
> > + struct drm_crtc *crtc;
> > + struct drm_crtc_state *old_crtc_state;
> > + unsigned int crtc_vblank_mask; /* unused */
> > + int i;
> > +
> > + for_each_crtc_in_state(state, crtc, old_crtc_state, i) {
> > + struct intel_crtc *intel_crtc = to_intel_crtc(crtc);
> > + struct intel_crtc_state *cstate =
> > + to_intel_crtc_state(crtc->state);
> > + bool vblank_wait = false;
> > +
> > + if (cstate->wm.skl.ddb_realloc != step || !crtc->state-
> > >active)
> > + continue;
> > +
> > + /*
> > + Â* If we're changing the ddb allocation of this pipe to
> > make
> > + Â* room for another pipe, we have to wait for the pipe's
> > ddb
> > + Â* allocations to actually update by waiting for a vblank.
> > + Â* Otherwise we risk the next pipe updating before this
> > pipe
> > + Â* finishes, resulting in the pipe fetching from ddb space
> > for
> > + Â* the wrong pipe.
> > + Â*
> > + Â* However, if we know we don't have any more pipes to move
> > + Â* around, we can skip this wait and the new ddb allocation
> > + Â* will take effect at the start of the next vblank.
> > + Â*/
> > + switch (step) {
> > + case SKL_DDB_STEP_NO_OVERLAP:
> > + case SKL_DDB_STEP_OVERLAP:
> > + if (step != intel_state->last_ddb_step)
> > + vblank_wait = true;
> > +
> > + /* drop through */
> > + case SKL_DDB_STEP_FINAL:
> > + DRM_DEBUG_KMS(
> > + ÂÂÂÂ"Updating [CRTC:%d:pipe %c] for DDB step %d\n",
> > + ÂÂÂÂcrtc->base.id, pipe_name(intel_crtc->pipe),
> > + ÂÂÂÂstep);
> > +
> > + case SKL_DDB_STEP_NONE:
> > + break;
> > + }
>
> Not sure we really need this step stuff. How about?
>
> for_each_crtc
> if (crtc_needs_disabling)
> disable_crtc();
>
> do {
> progress = false;
> wait_vbl_pipes=0;
> for_each_crtc() {
> if (!active || needs_modeset)
> continue;
> if (!ddb_changed)
> continue;
> if (new_ddb_overlaps_with_any_other_pipes_current_ddb)
> continue;
> commit;
> wait_vbl_pipes |= pipe;
> progress = true;
> }
> wait_vbls(wait_vbl_pipes);
> } while (progress);
>
> for_each_crtc
> if (crtc_needs_enabling)
> enable_crtc();
> commit;
> }

I'm fine with this; it might make this logic a little easier to read.
>
> Or if we're paranoid, we could also have an upper bound on the
> loop and assert that we never reach it.
>
>
> Though one thing I don't particularly like about this commit while
> changing the ddb approach is that it's going to make the update
> appear even less atomic. What I'd rather like to do for the normal
> commit path is this:
>
> for_each_crtc
> if (crtc_needs_disabling)
> disable_planes
> for_each_crtc
> if (crtc_needs_disabling)
> disable_crtc
> for_each_crtc
> if (crtc_needs_enabling)
> enable_crtc
> for_each_crtc
> if (active)
> commit_planes;
>
> That way everything would pop in and out as close together as possible.
> Hmm. Actually, I wonder... I'm thinking we should be able to enable all
> crtcs prior to entering the ddb commit loop, on account of no planes
> being enabled on those crtcs until we commit them. And if no planes are
> enabled, running the pipe w/o allocated ddb should be fine. So with that
> approach, I think we should be able to commit all planes within a few
> iterations of the loop, and hence within a few vblanks.

I can't see any issues with this, and this would definitely make the code a lot
cleaner. I'm alright with going this route if Matt doesn't see any issues with
it as well.

Cheers,
Lyude

>
> >
> > +
> > + intel_update_crtc(crtc, state, old_crtc_state,
> > + ÂÂ&crtc_vblank_mask);
> > +
> > + if (vblank_wait)
> > + intel_wait_for_vblank(state->dev, intel_crtc-
> > >pipe);
> > + }
> > +}
> > +
> > +static void skl_update_crtcs(struct drm_atomic_state *state,
> > + ÂÂÂÂÂunsigned int *crtc_vblank_mask)
> > +{
> > + struct intel_atomic_state *intel_state =
> > to_intel_atomic_state(state);
> > + enum skl_ddb_step step;
> > +
> > + for (step = 0; step <= intel_state->last_ddb_step; step++)
> > + skl_do_ddb_step(state, step);
> > +}
> > +
> > Âstatic void intel_atomic_commit_tail(struct drm_atomic_state *state)
> > Â{
> > Â struct drm_device *dev = state->dev;
> > @@ -15235,8 +15308,6 @@ void intel_init_display_hooks(struct
> > drm_i915_private *dev_priv)
> > Â dev_priv->display.crtc_disable = i9xx_crtc_disable;
> > Â }
> > Â
> > - dev_priv->display.update_crtcs = intel_update_crtcs;
> > -
> > Â /* Returns the core display clock speed */
> > Â if (IS_SKYLAKE(dev_priv) || IS_KABYLAKE(dev_priv))
> > Â dev_priv->display.get_display_clock_speed =
> > @@ -15326,6 +15397,11 @@ void intel_init_display_hooks(struct
> > drm_i915_private *dev_priv)
> > Â skl_modeset_calc_cdclk;
> > Â }
> > Â
> > + if (dev_priv->info.gen >= 9)
> > + dev_priv->display.update_crtcs = skl_update_crtcs;
> > + else
> > + dev_priv->display.update_crtcs = intel_update_crtcs;
> > +
> > Â switch (INTEL_INFO(dev_priv)->gen) {
> > Â case 2:
> > Â dev_priv->display.queue_flip = intel_gen2_queue_flip;
> > diff --git a/drivers/gpu/drm/i915/intel_drv.h
> > b/drivers/gpu/drm/i915/intel_drv.h
> > index 1b444d3..cf5da83 100644
> > --- a/drivers/gpu/drm/i915/intel_drv.h
> > +++ b/drivers/gpu/drm/i915/intel_drv.h
> > @@ -334,6 +334,7 @@ struct intel_atomic_state {
> > Â
> > Â /* Gen9+ only */
> > Â struct skl_wm_values wm_results;
> > + int last_ddb_step;
> > Â};
> > Â
> > Âstruct intel_plane_state {
> > @@ -437,6 +438,13 @@ struct skl_pipe_wm {
> > Â uint32_t linetime;
> > Â};
> > Â
> > +enum skl_ddb_step {
> > + SKL_DDB_STEP_NONE = 0,
> > + SKL_DDB_STEP_NO_OVERLAP,
> > + SKL_DDB_STEP_OVERLAP,
> > + SKL_DDB_STEP_FINAL
> > +};
> > +
> > Âstruct intel_crtc_wm_state {
> > Â union {
> > Â struct {
> > @@ -467,6 +475,8 @@ struct intel_crtc_wm_state {
> > Â /* minimum block allocation */
> > Â uint16_t minimum_blocks[I915_MAX_PLANES];
> > Â uint16_t minimum_y_blocks[I915_MAX_PLANES];
> > +
> > + enum skl_ddb_step ddb_realloc;
> > Â } skl;
> > Â };
> > Â
> > diff --git a/drivers/gpu/drm/i915/intel_pm.c
> > b/drivers/gpu/drm/i915/intel_pm.c
> > index 6f5beb3..636c90a 100644
> > --- a/drivers/gpu/drm/i915/intel_pm.c
> > +++ b/drivers/gpu/drm/i915/intel_pm.c
> > @@ -3816,6 +3816,11 @@ void skl_write_plane_wm(struct intel_crtc
> > *intel_crtc,
> > Â ÂÂÂwm->plane[pipe][plane][level]);
> > Â }
> > Â I915_WRITE(PLANE_WM_TRANS(pipe, plane), wm-
> > >plane_trans[pipe][plane]);
> > +
> > + skl_ddb_entry_write(dev_priv, PLANE_BUF_CFG(pipe, plane),
> > + ÂÂÂÂ&wm->ddb.plane[pipe][plane]);
> > + skl_ddb_entry_write(dev_priv, PLANE_NV12_BUF_CFG(pipe, plane),
> > + ÂÂÂÂ&wm->ddb.y_plane[pipe][plane]);
> > Â}
> > Â
> > Âvoid skl_write_cursor_wm(struct intel_crtc *intel_crtc,
> > @@ -3832,170 +3837,51 @@ void skl_write_cursor_wm(struct intel_crtc
> > *intel_crtc,
> > Â ÂÂÂwm->plane[pipe][PLANE_CURSOR][level]);
> > Â }
> > Â I915_WRITE(CUR_WM_TRANS(pipe), wm-
> > >plane_trans[pipe][PLANE_CURSOR]);
> > -}
> > -
> > -static void skl_write_wm_values(struct drm_i915_private *dev_priv,
> > - const struct skl_wm_values *new)
> > -{
> > - struct drm_device *dev = &dev_priv->drm;
> > - struct intel_crtc *crtc;
> > -
> > - for_each_intel_crtc(dev, crtc) {
> > - int i;
> > - enum pipe pipe = crtc->pipe;
> > -
> > - if ((new->dirty_pipes & drm_crtc_mask(&crtc->base)) == 0)
> > - continue;
> > - if (!crtc->active)
> > - continue;
> > Â
> > - for (i = 0; i < intel_num_planes(crtc); i++) {
> > - skl_ddb_entry_write(dev_priv,
> > - ÂÂÂÂPLANE_BUF_CFG(pipe, i),
> > - ÂÂÂÂ&new->ddb.plane[pipe][i]);
> > - skl_ddb_entry_write(dev_priv,
> > - ÂÂÂÂPLANE_NV12_BUF_CFG(pipe, i),
> > - ÂÂÂÂ&new->ddb.y_plane[pipe][i]);
> > - }
> > -
> > - skl_ddb_entry_write(dev_priv, CUR_BUF_CFG(pipe),
> > - ÂÂÂÂ&new->ddb.plane[pipe][PLANE_CURSOR]);
> > - }
> > + skl_ddb_entry_write(dev_priv, CUR_BUF_CFG(pipe),
> > + ÂÂÂÂ&wm->ddb.plane[pipe][PLANE_CURSOR]);
> > Â}
> > Â
> > -/*
> > - * When setting up a new DDB allocation arrangement, we need to correctly
> > - * sequence the times at which the new allocations for the pipes are taken
> > into
> > - * account or we'll have pipes fetching from space previously allocated to
> > - * another pipe.
> > - *
> > - * Roughly the sequence looks like:
> > - *ÂÂ1. re-allocate the pipe(s) with the allocation being reduced and not
> > - *ÂÂÂÂÂoverlapping with a previous light-up pipe (another way to put it is:
> > - *ÂÂÂÂÂpipes with their new allocation strickly included into their old
> > ones).
> > - *ÂÂ2. re-allocate the other pipes that get their allocation reduced
> > - *ÂÂ3. allocate the pipes having their allocation increased
> > - *
> > - * Steps 1. and 2. are here to take care of the following case:
> > - * - Initially DDB looks like this:
> > - *ÂÂÂÂÂ|ÂÂÂBÂÂÂÂ|ÂÂÂCÂÂÂÂ|
> > - * - enable pipe A.
> > - * - pipe B has a reduced DDB allocation that overlaps with the old pipe C
> > - *ÂÂÂallocation
> > - *ÂÂÂÂÂ|ÂÂAÂÂ|ÂÂBÂÂ|ÂÂCÂÂ|
> > - *
> > - * We need to sequence the re-allocation: C, B, A (and not B, C, A).
> > - */
> > -
> > -static void
> > -skl_wm_flush_pipe(struct drm_i915_private *dev_priv, enum pipe pipe, int
> > pass)
> > +static bool
> > +skl_ddb_allocation_equals(const struct skl_ddb_allocation *old,
> > + ÂÂconst struct skl_ddb_allocation *new,
> > + ÂÂenum pipe pipe)
> > Â{
> > - int plane;
> > -
> > - DRM_DEBUG_KMS("flush pipe %c (pass %d)\n", pipe_name(pipe), pass);
> > -
> > - for_each_plane(dev_priv, pipe, plane) {
> > - I915_WRITE(PLANE_SURF(pipe, plane),
> > - ÂÂÂI915_READ(PLANE_SURF(pipe, plane)));
> > - }
> > - I915_WRITE(CURBASE(pipe), I915_READ(CURBASE(pipe)));
> > + return new->pipe[pipe].start == old->pipe[pipe].start &&
> > + ÂÂÂÂÂÂÂnew->pipe[pipe].end == old->pipe[pipe].end;
> > Â}
> > Â
> > Âstatic bool
> > -skl_ddb_allocation_included(const struct skl_ddb_allocation *old,
> > +skl_ddb_allocation_overlaps(struct drm_atomic_state *state,
> > + ÂÂÂÂconst struct skl_ddb_allocation *old,
> > Â ÂÂÂÂconst struct skl_ddb_allocation *new,
> > Â ÂÂÂÂenum pipe pipe)
> > Â{
> > - uint16_t old_size, new_size;
> > -
> > - old_size = skl_ddb_entry_size(&old->pipe[pipe]);
> > - new_size = skl_ddb_entry_size(&new->pipe[pipe]);
> > -
> > - return old_size != new_size &&
> > - ÂÂÂÂÂÂÂnew->pipe[pipe].start >= old->pipe[pipe].start &&
> > - ÂÂÂÂÂÂÂnew->pipe[pipe].end <= old->pipe[pipe].end;
> > -}
> > -
> > -static void skl_flush_wm_values(struct drm_i915_private *dev_priv,
> > - struct skl_wm_values *new_values)
> > -{
> > - struct drm_device *dev = &dev_priv->drm;
> > - struct skl_ddb_allocation *cur_ddb, *new_ddb;
> > - bool reallocated[I915_MAX_PIPES] = {};
> > - struct intel_crtc *crtc;
> > - enum pipe pipe;
> > -
> > - new_ddb = &new_values->ddb;
> > - cur_ddb = &dev_priv->wm.skl_hw.ddb;
> > -
> > - /*
> > - Â* First pass: flush the pipes with the new allocation contained
> > into
> > - Â* the old space.
> > - Â*
> > - Â* We'll wait for the vblank on those pipes to ensure we can safely
> > - Â* re-allocate the freed space without this pipe fetching from it.
> > - Â*/
> > - for_each_intel_crtc(dev, crtc) {
> > - if (!crtc->active)
> > - continue;
> > -
> > - pipe = crtc->pipe;
> > -
> > - if (!skl_ddb_allocation_included(cur_ddb, new_ddb, pipe))
> > - continue;
> > -
> > - skl_wm_flush_pipe(dev_priv, pipe, 1);
> > - intel_wait_for_vblank(dev, pipe);
> > -
> > - reallocated[pipe] = true;
> > - }
> > -
> > -
> > - /*
> > - Â* Second pass: flush the pipes that are having their allocation
> > - Â* reduced, but overlapping with a previous allocation.
> > - Â*
> > - Â* Here as well we need to wait for the vblank to make sure the
> > freed
> > - Â* space is not used anymore.
> > - Â*/
> > - for_each_intel_crtc(dev, crtc) {
> > - if (!crtc->active)
> > - continue;
> > -
> > - pipe = crtc->pipe;
> > -
> > - if (reallocated[pipe])
> > - continue;
> > -
> > - if (skl_ddb_entry_size(&new_ddb->pipe[pipe]) <
> > - ÂÂÂÂskl_ddb_entry_size(&cur_ddb->pipe[pipe])) {
> > - skl_wm_flush_pipe(dev_priv, pipe, 2);
> > - intel_wait_for_vblank(dev, pipe);
> > - reallocated[pipe] = true;
> > - }
> > - }
> > -
> > - /*
> > - Â* Third pass: flush the pipes that got more space allocated.
> > - Â*
> > - Â* We don't need to actively wait for the update here, next vblank
> > - Â* will just get more DDB space with the correct WM values.
> > - Â*/
> > - for_each_intel_crtc(dev, crtc) {
> > - if (!crtc->active)
> > - continue;
> > + struct drm_device *dev = state->dev;
> > + struct intel_crtc *intel_crtc;
> > + enum pipe otherp;
> > Â
> > - pipe = crtc->pipe;
> > + for_each_intel_crtc(dev, intel_crtc) {
> > + otherp = intel_crtc->pipe;
> > Â
> > Â /*
> > - Â* At this point, only the pipes more space than before are
> > - Â* left to re-allocate.
> > + Â* When checking for overlaps, we don't want to:
> > + Â*ÂÂ- Compare against ourselves
> > + Â*ÂÂ- Compare against pipes that will be disabled in step 0
> > + Â*ÂÂ- Compare against pipes that won't be enabled until
> > step 3
> > Â Â*/
> > - if (reallocated[pipe])
> > + if (otherp == pipe || !new->pipe[otherp].end ||
> > + ÂÂÂÂ!old->pipe[otherp].end)
> > Â continue;
> > Â
> > - skl_wm_flush_pipe(dev_priv, pipe, 3);
> > + if ((new->pipe[pipe].start >= old->pipe[otherp].start &&
> > + ÂÂÂÂÂnew->pipe[pipe].start < old->pipe[otherp].end) ||
> > + ÂÂÂÂ(old->pipe[otherp].start >= new->pipe[pipe].start &&
> > + ÂÂÂÂÂold->pipe[otherp].start < new->pipe[pipe].end))
> > + return true;
> > Â }
> > +
> > + return false;
> > Â}
> > Â
> > Âstatic int skl_update_pipe_wm(struct drm_crtc_state *cstate,
> > @@ -4038,8 +3924,10 @@ skl_compute_ddb(struct drm_atomic_state *state)
> > Â struct drm_device *dev = state->dev;
> > Â struct drm_i915_private *dev_priv = to_i915(dev);
> > Â struct intel_atomic_state *intel_state =
> > to_intel_atomic_state(state);
> > + struct intel_crtc_state *cstate;
> > Â struct intel_crtc *intel_crtc;
> > - struct skl_ddb_allocation *ddb = &intel_state->wm_results.ddb;
> > + struct skl_ddb_allocation *old_ddb = &dev_priv->wm.skl_hw.ddb;
> > + struct skl_ddb_allocation *new_ddb = &intel_state->wm_results.ddb;
> > Â uint32_t realloc_pipes = pipes_modified(state);
> > Â int ret;
> > Â
> > @@ -4071,13 +3959,11 @@ skl_compute_ddb(struct drm_atomic_state *state)
> > Â }
> > Â
> > Â for_each_intel_crtc_mask(dev, intel_crtc, realloc_pipes) {
> > - struct intel_crtc_state *cstate;
> > -
> > Â cstate = intel_atomic_get_crtc_state(state, intel_crtc);
> > Â if (IS_ERR(cstate))
> > Â return PTR_ERR(cstate);
> > Â
> > - ret = skl_allocate_pipe_ddb(cstate, ddb);
> > + ret = skl_allocate_pipe_ddb(cstate, new_ddb);
> > Â if (ret)
> > Â return ret;
> > Â
> > @@ -4086,6 +3972,73 @@ skl_compute_ddb(struct drm_atomic_state *state)
> > Â return ret;
> > Â }
> > Â
> > + /*
> > + Â* When setting up a new DDB allocation arrangement, we need to
> > + Â* correctly sequence the times at which the new allocations for
> > the
> > + Â* pipes are taken into account or we'll have pipes fetching from
> > space
> > + Â* previously allocated to another pipe.
> > + Â*
> > + Â* Roughly the final sequence we want looks like this:
> > + Â*ÂÂ1. Disable any pipes we're not going to be using anymore
> > + Â*ÂÂ2. Reallocate all of the active pipes whose new ddb allocations
> > + Â*ÂÂwon't overlap with another active pipe's ddb allocation.
> > + Â*ÂÂ3. Reallocate remaining active pipes, if any.
> > + Â*ÂÂ4. Enable any new pipes, if any.
> > + Â*
> > +  * Example:
> > +  * Initially DDB looks like this:
> > +  *   |   B    |   C    |
> > +  * And the final DDB should look like this:
> > +  *   |  B  |  C  |  A  |
> > +  *
> > +  * 1. We're not disabling any pipes, so do nothing on this step.
> > +  * 2. Pipe B's new allocation wouldn't overlap with pipe C, however
> > +  * pipe C's new allocation does overlap with pipe B's current
> > +  * allocation. Reallocate B first so the DDB looks like this:
> > +  *   |  B  |xx|   C    |
> > +  * 3. Now we can safely reallocate pipe C to it's new location:
> > +  *   |  B  |  C  |xxxxx|
> > +  * 4. Enable any remaining pipes, in this case A
> > +  *   |  B  |  C  |  A  |
> > + Â*
> > + Â* As well, between every pipe reallocation we have to wait for a
> > + Â* vblank on the pipe so that we ensure it's new allocation has
> > taken
> > + Â* effect by the time we start moving the next pipe. This can be
> > + Â* skipped on the last step we need to perform, which is why we
> > keep
> > + Â* track of that information here. For example, if we've
> > reallocated
> > + Â* all the pipes that need changing by the time we reach step 3, we
> > can
> > + Â* finish without waiting for the pipes we changed in step 3 to
> > update.
> > + Â*/
> > + for_each_intel_crtc_mask(dev, intel_crtc, realloc_pipes) {
> > + enum pipe pipe = intel_crtc->pipe;
> > + enum skl_ddb_step step;
> > +
> > + cstate = intel_atomic_get_crtc_state(state, intel_crtc);
> > + if (IS_ERR(cstate))
> > + return PTR_ERR(cstate);
> > +
> > + /* Step 1: Pipes we're disabling / haven't changed */
> > + if (skl_ddb_allocation_equals(old_ddb, new_ddb, pipe) ||
> > + ÂÂÂÂnew_ddb->pipe[pipe].end == 0) {
> > + step = SKL_DDB_STEP_NONE;
> > + /* Step 2-3: Active pipes we're reallocating */
> > + } else if (old_ddb->pipe[pipe].end != 0) {
> > + if (skl_ddb_allocation_overlaps(state, old_ddb,
> > new_ddb,
> > + pipe))
> > + step = SKL_DDB_STEP_OVERLAP;
> > + else
> > + step = SKL_DDB_STEP_NO_OVERLAP;
> > + /* Step 4: Pipes we're enabling */
> > + } else {
> > + step = SKL_DDB_STEP_FINAL;
> > + }
> > +
> > + cstate->wm.skl.ddb_realloc = step;
> > +
> > + if (step > intel_state->last_ddb_step)
> > + intel_state->last_ddb_step = step;
> > + }
> > +
> > Â return 0;
> > Â}
> > Â
> > @@ -4110,10 +4063,13 @@ skl_copy_wm_for_pipe(struct skl_wm_values *dst,
> > Âstatic int
> > Âskl_compute_wm(struct drm_atomic_state *state)
> > Â{
> > + struct drm_i915_private *dev_priv = to_i915(state->dev);
> > Â struct drm_crtc *crtc;
> > Â struct drm_crtc_state *cstate;
> > Â struct intel_atomic_state *intel_state =
> > to_intel_atomic_state(state);
> > Â struct skl_wm_values *results = &intel_state->wm_results;
> > + struct skl_ddb_allocation *old_ddb = &dev_priv->wm.skl_hw.ddb;
> > + struct skl_ddb_allocation *new_ddb = &results->ddb;
> > Â struct skl_pipe_wm *pipe_wm;
> > Â bool changed = false;
> > Â int ret, i;
> > @@ -4152,7 +4108,10 @@ skl_compute_wm(struct drm_atomic_state *state)
> > Â struct intel_crtc *intel_crtc = to_intel_crtc(crtc);
> > Â struct intel_crtc_state *intel_cstate =
> > Â to_intel_crtc_state(cstate);
> > + enum skl_ddb_step step;
> > + enum pipe pipe;
> > Â
> > + pipe = intel_crtc->pipe;
> > Â pipe_wm = &intel_cstate->wm.skl.optimal;
> > Â ret = skl_update_pipe_wm(cstate, &results->ddb, pipe_wm,
> > Â Â&changed);
> > @@ -4167,7 +4126,18 @@ skl_compute_wm(struct drm_atomic_state *state)
> > Â continue;
> > Â
> > Â intel_cstate->update_wm_pre = true;
> > + step = intel_cstate->wm.skl.ddb_realloc;
> > Â skl_compute_wm_results(crtc->dev, pipe_wm, results,
> > intel_crtc);
> > +
> > + if (!skl_ddb_entry_equal(&old_ddb->pipe[pipe],
> > + Â&new_ddb->pipe[pipe])) {
> > + DRM_DEBUG_KMS(
> > + ÂÂÂÂ"DDB changes for [CRTC:%d:pipe %c]: (%3d - %3d)
> > -> (%3d - %3d) on step %d\n",
> > + ÂÂÂÂintel_crtc->base.base.id, pipe_name(pipe),
> > + ÂÂÂÂold_ddb->pipe[pipe].start, old_ddb-
> > >pipe[pipe].end,
> > + ÂÂÂÂnew_ddb->pipe[pipe].start, new_ddb-
> > >pipe[pipe].end,
> > + ÂÂÂÂstep);
> > + }
> > Â }
> > Â
> > Â return 0;
> > @@ -4191,8 +4161,20 @@ static void skl_update_wm(struct drm_crtc *crtc)
> > Â
> > Â mutex_lock(&dev_priv->wm.wm_mutex);
> > Â
> > - skl_write_wm_values(dev_priv, results);
> > - skl_flush_wm_values(dev_priv, results);
> > + /*
> > + Â* If this pipe isn't active already, we're going to be enabling it
> > + Â* very soon. Since it's safe to update these while the pipe's shut
> > off,
> > + Â* just do so here. Already active pipes will have their watermarks
> > + Â* updated once we update their planes.
> > + Â*/
> > + if (!intel_crtc->active) {
> > + int plane;
> > +
> > + for (plane = 0; plane < intel_num_planes(intel_crtc);
> > plane++)
> > + skl_write_plane_wm(intel_crtc, results, plane);
> > +
> > + skl_write_cursor_wm(intel_crtc, results);
> > + }
> > Â
> > Â /*
> > Â Â* Store the new configuration (but only for the pipes that have
> > --Â
> > 2.7.4
>