From: Stanislav Lisovskiy <stanislav.lisovskiy@xxxxxxxxx> Starting from xe3, hw now is capable of switching automatically to min ddb allocation(not using any extra blocks) or interim SAGV-adjusted allocation in case if async flip is used. For that purpose there is now additional register, where correspodent values have to be programmed. Bspec: 69880, 72053 Signed-off-by: Stanislav Lisovskiy <stanislav.lisovskiy@xxxxxxxxx> Signed-off-by: Vinod Govindapillai <vinod.govindapillai@xxxxxxxxx> --- .../gpu/drm/i915/display/intel_atomic_plane.c | 9 ++ .../drm/i915/display/intel_display_types.h | 8 ++ .../drm/i915/display/skl_universal_plane.c | 31 +++++++ .../i915/display/skl_universal_plane_regs.h | 13 +++ drivers/gpu/drm/i915/display/skl_watermark.c | 85 +++++++++++++++++-- 5 files changed, 140 insertions(+), 6 deletions(-) diff --git a/drivers/gpu/drm/i915/display/intel_atomic_plane.c b/drivers/gpu/drm/i915/display/intel_atomic_plane.c index 2c8fae8de4da..7940cb911889 100644 --- a/drivers/gpu/drm/i915/display/intel_atomic_plane.c +++ b/drivers/gpu/drm/i915/display/intel_atomic_plane.c @@ -213,6 +213,15 @@ use_min_ddb(const struct intel_crtc_state *crtc_state, { struct intel_display *display = to_intel_display(plane); + /* + * For xe3 onwards this feature is implemented in + * hardware, so no need to force relative data rate to 0, + * we will update a specific register with min_ddb without + * extra blocks. + */ + if (DISPLAY_VER(display) >= 30) + return false; + return DISPLAY_VER(display) >= 13 && crtc_state->uapi.async_flip && plane->async_flip; diff --git a/drivers/gpu/drm/i915/display/intel_display_types.h b/drivers/gpu/drm/i915/display/intel_display_types.h index d2b68505f088..c0548db0061c 100644 --- a/drivers/gpu/drm/i915/display/intel_display_types.h +++ b/drivers/gpu/drm/i915/display/intel_display_types.h @@ -770,6 +770,7 @@ struct skl_wm_level { bool enable; bool ignore_lines; bool can_sagv; + bool auto_min_ddb_allowed; }; struct skl_plane_wm { @@ -863,6 +864,13 @@ struct intel_crtc_wm_state { struct skl_ddb_entry plane_ddb[I915_MAX_PLANES]; /* pre-icl: for planar Y */ struct skl_ddb_entry plane_ddb_y[I915_MAX_PLANES]; + + /* + * xe3: Minimum amount of display blocks and minimum + * sagv allocation required for async flip + */ + struct skl_ddb_entry plane_min_ddb[I915_MAX_PLANES]; + struct skl_ddb_entry plane_interim_ddb[I915_MAX_PLANES]; } skl; struct { diff --git a/drivers/gpu/drm/i915/display/skl_universal_plane.c b/drivers/gpu/drm/i915/display/skl_universal_plane.c index 038ca2ec5d7a..69d5ca74c594 100644 --- a/drivers/gpu/drm/i915/display/skl_universal_plane.c +++ b/drivers/gpu/drm/i915/display/skl_universal_plane.c @@ -715,6 +715,26 @@ static u32 skl_plane_ddb_reg_val(const struct skl_ddb_entry *entry) PLANE_BUF_START(entry->start); } +static u32 ptl_plane_min_ddb_reg_val(const struct skl_ddb_entry *min_ddb_entry, + const struct skl_ddb_entry *interim_ddb_entry) +{ + u32 val = 0; + + if (min_ddb_entry->end) { + val |= PLANE_AUTO_MIN_DBUF_EN; + val |= REG_FIELD_PREP(PLANE_MIN_DDB_BLOCKS_MASK, + min_ddb_entry->end - min_ddb_entry->start); + } + + if (interim_ddb_entry->end) { + val |= PLANE_AUTO_MIN_DBUF_EN; + val |= REG_FIELD_PREP(PLANE_INTERIM_DDB_BLOCKS_MASK, + interim_ddb_entry->end - interim_ddb_entry->start); + } + + return val; +} + static u32 skl_plane_wm_reg_val(const struct skl_wm_level *level) { u32 val = 0; @@ -723,6 +743,9 @@ static u32 skl_plane_wm_reg_val(const struct skl_wm_level *level) val |= PLANE_WM_EN; if (level->ignore_lines) val |= PLANE_WM_IGNORE_LINES; + if (level->auto_min_ddb_allowed) + val |= PLANE_WM_AUTO_MIN_ALLOC_EN; + val |= REG_FIELD_PREP(PLANE_WM_BLOCKS_MASK, level->blocks); val |= REG_FIELD_PREP(PLANE_WM_LINES_MASK, level->lines); @@ -742,6 +765,10 @@ static void skl_write_plane_wm(struct intel_dsb *dsb, &crtc_state->wm.skl.plane_ddb[plane_id]; const struct skl_ddb_entry *ddb_y = &crtc_state->wm.skl.plane_ddb_y[plane_id]; + const struct skl_ddb_entry *min_ddb = + &crtc_state->wm.skl.plane_min_ddb[plane_id]; + const struct skl_ddb_entry *interim_ddb = + &crtc_state->wm.skl.plane_interim_ddb[plane_id]; int level; for (level = 0; level < i915->display.wm.num_levels; level++) @@ -766,6 +793,10 @@ static void skl_write_plane_wm(struct intel_dsb *dsb, if (DISPLAY_VER(i915) < 11) intel_de_write_dsb(display, dsb, PLANE_NV12_BUF_CFG(pipe, plane_id), skl_plane_ddb_reg_val(ddb_y)); + + if (DISPLAY_VER(display) >= 30) + intel_de_write_dsb(display, dsb, PLANE_MIN_BUF_CFG(pipe, plane_id), + ptl_plane_min_ddb_reg_val(min_ddb, interim_ddb)); } static void diff --git a/drivers/gpu/drm/i915/display/skl_universal_plane_regs.h b/drivers/gpu/drm/i915/display/skl_universal_plane_regs.h index ff31a00d511e..65a5482fae60 100644 --- a/drivers/gpu/drm/i915/display/skl_universal_plane_regs.h +++ b/drivers/gpu/drm/i915/display/skl_universal_plane_regs.h @@ -322,6 +322,7 @@ _PLANE_WM_2_A_0, _PLANE_WM_2_B_0) #define PLANE_WM_EN REG_BIT(31) #define PLANE_WM_IGNORE_LINES REG_BIT(30) +#define PLANE_WM_AUTO_MIN_ALLOC_EN REG_BIT(29) #define PLANE_WM_LINES_MASK REG_GENMASK(26, 14) #define PLANE_WM_BLOCKS_MASK REG_GENMASK(11, 0) @@ -373,12 +374,24 @@ #define PLANE_BUF_CFG(pipe, plane) _MMIO_SKL_PLANE((pipe), (plane), \ _PLANE_BUF_CFG_1_A, _PLANE_BUF_CFG_1_B, \ _PLANE_BUF_CFG_2_A, _PLANE_BUF_CFG_2_B) +#define _PLANE_MIN_BUF_CFG_1_A 0x70274 +#define _PLANE_MIN_BUF_CFG_2_A 0x70374 +#define _PLANE_MIN_BUF_CFG_1_B 0x71274 +#define _PLANE_MIN_BUF_CFG_2_B 0x71374 +#define PLANE_MIN_BUF_CFG(pipe, plane) _MMIO_SKL_PLANE((pipe), (plane), \ + _PLANE_MIN_BUF_CFG_1_A, _PLANE_MIN_BUF_CFG_1_B, \ + _PLANE_MIN_BUF_CFG_2_A, _PLANE_MIN_BUF_CFG_2_B) + /* skl+: 10 bits, icl+ 11 bits, adlp+ 12 bits */ #define PLANE_BUF_END_MASK REG_GENMASK(27, 16) #define PLANE_BUF_END(end) REG_FIELD_PREP(PLANE_BUF_END_MASK, (end)) #define PLANE_BUF_START_MASK REG_GENMASK(11, 0) #define PLANE_BUF_START(start) REG_FIELD_PREP(PLANE_BUF_START_MASK, (start)) +#define PLANE_AUTO_MIN_DBUF_EN REG_BIT(31) +#define PLANE_MIN_DDB_BLOCKS_MASK REG_GENMASK(27, 16) +#define PLANE_INTERIM_DDB_BLOCKS_MASK REG_GENMASK(11, 0) + /* tgl+ */ #define _SEL_FETCH_PLANE_CTL_1_A 0x70890 #define _SEL_FETCH_PLANE_CTL_2_A 0x708b0 diff --git a/drivers/gpu/drm/i915/display/skl_watermark.c b/drivers/gpu/drm/i915/display/skl_watermark.c index d961d01343b3..4e6433374e0d 100644 --- a/drivers/gpu/drm/i915/display/skl_watermark.c +++ b/drivers/gpu/drm/i915/display/skl_watermark.c @@ -797,7 +797,9 @@ skl_ddb_get_hw_plane_state(struct intel_display *display, const enum pipe pipe, const enum plane_id plane_id, struct skl_ddb_entry *ddb, - struct skl_ddb_entry *ddb_y) + struct skl_ddb_entry *ddb_y, + struct skl_ddb_entry *min_ddb, + struct skl_ddb_entry *interim_ddb) { u32 val; @@ -811,6 +813,17 @@ skl_ddb_get_hw_plane_state(struct intel_display *display, val = intel_de_read(display, PLANE_BUF_CFG(pipe, plane_id)); skl_ddb_entry_init_from_hw(ddb, val); + if (DISPLAY_VER(display) >= 30) { + val = intel_de_read(display, PLANE_MIN_BUF_CFG(pipe, plane_id)); + + skl_ddb_entry_init(min_ddb, 0, + REG_FIELD_GET(PLANE_MIN_DDB_BLOCKS_MASK, + val)); + skl_ddb_entry_init(interim_ddb, 0, + REG_FIELD_GET(PLANE_INTERIM_DDB_BLOCKS_MASK, + val)); + } + if (DISPLAY_VER(display) >= 11) return; @@ -820,7 +833,9 @@ skl_ddb_get_hw_plane_state(struct intel_display *display, static void skl_pipe_ddb_get_hw_state(struct intel_crtc *crtc, struct skl_ddb_entry *ddb, - struct skl_ddb_entry *ddb_y) + struct skl_ddb_entry *ddb_y, + struct skl_ddb_entry *min_ddb, + struct skl_ddb_entry *interim_ddb) { struct drm_i915_private *i915 = to_i915(crtc->base.dev); enum intel_display_power_domain power_domain; @@ -837,7 +852,9 @@ static void skl_pipe_ddb_get_hw_state(struct intel_crtc *crtc, skl_ddb_get_hw_plane_state(&i915->display, pipe, plane_id, &ddb[plane_id], - &ddb_y[plane_id]); + &ddb_y[plane_id], + &min_ddb[plane_id], + &interim_ddb[plane_id]); intel_display_power_put(i915, power_domain, wakeref); } @@ -1374,7 +1391,9 @@ use_minimal_wm0_only(const struct intel_crtc_state *crtc_state, { struct intel_display *display = to_intel_display(plane); + /* Xe3 (ver >= 30) has auto minimum DDB enabled */ return DISPLAY_VER(display) >= 13 && + DISPLAY_VER(display) < 30 && crtc_state->uapi.async_flip && plane->async_flip; } @@ -1515,6 +1534,7 @@ skl_crtc_allocate_plane_ddb(struct intel_atomic_state *state, const struct intel_dbuf_state *dbuf_state = intel_atomic_get_new_dbuf_state(state); const struct skl_ddb_entry *alloc = &dbuf_state->ddb[crtc->pipe]; + struct intel_display *display = to_intel_display(state); int num_active = hweight8(dbuf_state->active_pipes); struct skl_plane_ddb_iter iter; enum plane_id plane_id; @@ -1525,6 +1545,8 @@ skl_crtc_allocate_plane_ddb(struct intel_atomic_state *state, /* Clear the partitioning for disabled planes. */ memset(crtc_state->wm.skl.plane_ddb, 0, sizeof(crtc_state->wm.skl.plane_ddb)); memset(crtc_state->wm.skl.plane_ddb_y, 0, sizeof(crtc_state->wm.skl.plane_ddb_y)); + memset(crtc_state->wm.skl.plane_min_ddb, 0, sizeof(crtc_state->wm.skl.plane_min_ddb)); + memset(crtc_state->wm.skl.plane_interim_ddb, 0, sizeof(crtc_state->wm.skl.plane_interim_ddb)); if (!crtc_state->hw.active) return 0; @@ -1597,6 +1619,10 @@ skl_crtc_allocate_plane_ddb(struct intel_atomic_state *state, &crtc_state->wm.skl.plane_ddb[plane_id]; struct skl_ddb_entry *ddb_y = &crtc_state->wm.skl.plane_ddb_y[plane_id]; + struct skl_ddb_entry *min_ddb = + &crtc_state->wm.skl.plane_min_ddb[plane_id]; + struct skl_ddb_entry *interim_ddb = + &crtc_state->wm.skl.plane_interim_ddb[plane_id]; const struct skl_plane_wm *wm = &crtc_state->wm.skl.optimal.planes[plane_id]; @@ -1612,6 +1638,20 @@ skl_crtc_allocate_plane_ddb(struct intel_atomic_state *state, } else { skl_allocate_plane_ddb(&iter, ddb, &wm->wm[level], crtc_state->rel_data_rate[plane_id]); + + /* + * xe3: Handle min_ddb and interim_ddb. Unlike the + * normal ddb allocation, min_ddb and interim_ddb config + * expects only the number of blocks from 0. The buffer + * start is found in PLANE_BUF_CFG + * Bspec: 72053 + */ + if (DISPLAY_VER(display) >= 30) { + skl_ddb_entry_init(min_ddb, 0, + wm->wm[0].min_ddb_alloc); + skl_ddb_entry_init(interim_ddb, 0, + wm->sagv.wm0.min_ddb_alloc); + } } } drm_WARN_ON(&i915->drm, iter.size != 0 || iter.data_rate != 0); @@ -1656,6 +1696,8 @@ skl_crtc_allocate_plane_ddb(struct intel_atomic_state *state, &crtc_state->wm.skl.plane_ddb[plane_id]; const struct skl_ddb_entry *ddb_y = &crtc_state->wm.skl.plane_ddb_y[plane_id]; + struct skl_ddb_entry *interim_ddb = + &crtc_state->wm.skl.plane_interim_ddb[plane_id]; struct skl_plane_wm *wm = &crtc_state->wm.skl.optimal.planes[plane_id]; @@ -1669,6 +1711,11 @@ skl_crtc_allocate_plane_ddb(struct intel_atomic_state *state, } skl_check_wm_level(&wm->sagv.wm0, ddb); + /* update the interim ddb, in case if it is changed */ + if (DISPLAY_VER(display) >= 30) + skl_ddb_entry_init(interim_ddb, 0, + wm->sagv.wm0.min_ddb_alloc); + skl_check_wm_level(&wm->sagv.trans_wm, ddb); } @@ -1747,6 +1794,7 @@ skl_compute_wm_params(const struct intel_crtc_state *crtc_state, int color_plane, unsigned int pan_x) { struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc); + struct intel_display *display = to_intel_display(crtc_state); struct drm_i915_private *i915 = to_i915(crtc->base.dev); u32 interm_pbpl; @@ -1805,7 +1853,7 @@ skl_compute_wm_params(const struct intel_crtc_state *crtc_state, wp->y_min_scanlines, wp->dbuf_block_size); - if (DISPLAY_VER(i915) >= 30) + if (DISPLAY_VER(display) >= 30) interm_pbpl += (pan_x != 0); else if (DISPLAY_VER(i915) >= 10) interm_pbpl++; @@ -1870,6 +1918,11 @@ static int skl_wm_max_lines(struct drm_i915_private *i915) return 31; } +static bool can_use_min_ddb(struct intel_display *display, int level) +{ + return DISPLAY_VER(display) >= 30 && level == 0; +} + static void skl_compute_plane_wm(const struct intel_crtc_state *crtc_state, struct intel_plane *plane, int level, @@ -1879,6 +1932,7 @@ static void skl_compute_plane_wm(const struct intel_crtc_state *crtc_state, struct skl_wm_level *result /* out */) { struct drm_i915_private *i915 = to_i915(crtc_state->uapi.crtc->dev); + struct intel_display *display = to_intel_display(crtc_state); uint_fixed_16_16_t method1, method2; uint_fixed_16_16_t selected_result; u32 blocks, lines, min_ddb_alloc = 0; @@ -2002,6 +2056,11 @@ static void skl_compute_plane_wm(const struct intel_crtc_state *crtc_state, /* Bspec says: value >= plane ddb allocation -> invalid, hence the +1 here */ result->min_ddb_alloc = max(min_ddb_alloc, blocks) + 1; result->enable = true; + /* + * For Xe3, when auto min DDB is enabled, it automatically switches to + * the wm level where this auto min ddb is enabled + */ + result->auto_min_ddb_allowed = can_use_min_ddb(display, level); if (DISPLAY_VER(i915) < 12 && i915->display.sagv.block_time_us) result->can_sagv = latency >= i915->display.sagv.block_time_us; @@ -2398,6 +2457,10 @@ static bool skl_plane_wm_equals(struct intel_display *display, */ if (!skl_wm_level_equals(&wm1->wm[level], &wm2->wm[level])) return false; + + if (DISPLAY_VER(display) >= 30 && + wm1->wm[level].auto_min_ddb_allowed != wm2->wm[level].auto_min_ddb_allowed) + return false; } return skl_wm_level_equals(&wm1->trans_wm, &wm2->trans_wm) && @@ -2929,6 +2992,8 @@ static void skl_wm_level_from_reg_val(struct intel_display *display, level->ignore_lines = val & PLANE_WM_IGNORE_LINES; level->blocks = REG_FIELD_GET(PLANE_WM_BLOCKS_MASK, val); level->lines = REG_FIELD_GET(PLANE_WM_LINES_MASK, val); + level->auto_min_ddb_allowed = DISPLAY_VER(display) >= 30 && + val & PLANE_WM_AUTO_MIN_ALLOC_EN; } static void skl_pipe_wm_get_hw_state(struct intel_crtc *crtc, @@ -3014,12 +3079,17 @@ static void skl_wm_get_hw_state(struct drm_i915_private *i915) &crtc_state->wm.skl.plane_ddb[plane_id]; struct skl_ddb_entry *ddb_y = &crtc_state->wm.skl.plane_ddb_y[plane_id]; + struct skl_ddb_entry *min_ddb = + &crtc_state->wm.skl.plane_min_ddb[plane_id]; + struct skl_ddb_entry *interim_ddb = + &crtc_state->wm.skl.plane_interim_ddb[plane_id]; if (!crtc_state->hw.active) continue; skl_ddb_get_hw_plane_state(display, crtc->pipe, - plane_id, ddb, ddb_y); + plane_id, ddb, ddb_y, + min_ddb, interim_ddb); skl_ddb_entry_union(&dbuf_state->ddb[pipe], ddb); skl_ddb_entry_union(&dbuf_state->ddb[pipe], ddb_y); @@ -3136,6 +3206,8 @@ void intel_wm_state_verify(struct intel_atomic_state *state, struct skl_hw_state { struct skl_ddb_entry ddb[I915_MAX_PLANES]; struct skl_ddb_entry ddb_y[I915_MAX_PLANES]; + struct skl_ddb_entry min_ddb[I915_MAX_PLANES]; + struct skl_ddb_entry interim_ddb[I915_MAX_PLANES]; struct skl_pipe_wm wm; } *hw; const struct skl_pipe_wm *sw_wm = &new_crtc_state->wm.skl.optimal; @@ -3152,7 +3224,8 @@ void intel_wm_state_verify(struct intel_atomic_state *state, skl_pipe_wm_get_hw_state(crtc, &hw->wm); - skl_pipe_ddb_get_hw_state(crtc, hw->ddb, hw->ddb_y); + skl_pipe_ddb_get_hw_state(crtc, hw->ddb, hw->ddb_y, hw->min_ddb, + hw->interim_ddb); hw_enabled_slices = intel_enabled_dbuf_slices_mask(display); -- 2.34.1