On Thu, Mar 07, 2024 at 12:05:42PM -0500, Frank Li wrote: > On Thu, Mar 07, 2024 at 05:57:29PM +0800, Xu Yang wrote: > > i.MX95 has a DDR PMU which is almostly same as i.MX93, it now supports > > read beat and write beat filter capabilities. This will add support for > > i.MX95 and enhance the driver to support specific filter handling for it. > > > > Usage: > > > > For read beat: > > ~# perf stat -a -I 1000 -e imx9_ddr0/eddrtq_pm_rd_beat_filt2,axi_mask=ID_MASK,axi_id=ID/ > > ~# perf stat -a -I 1000 -e imx9_ddr0/eddrtq_pm_rd_beat_filt1,axi_mask=ID_MASK,axi_id=ID/ > > ~# perf stat -a -I 1000 -e imx9_ddr0/eddrtq_pm_rd_beat_filt0,axi_mask=ID_MASK,axi_id=ID/ > > eg: For edma2: perf stat -a -I 1000 -e imx9_ddr0/eddrtq_pm_rd_beat_filt0,axi_mask=0x00f,axi_id=0x00c/ > > > > For write beat: > > ~# perf stat -a -I 1000 -e imx9_ddr0/eddrtq_pm_wr_beat_filt,axi_mask=ID_MASK,axi_id=ID/ > > eg: For edma2: perf stat -a -I 1000 -e imx9_ddr0/eddrtq_pm_wr_beat_filt,axi_mask=0x00f,axi_id=0x00c/ > > > > Signed-off-by: Xu Yang <xu.yang_2@xxxxxxx> > > > > --- > > Changes in v2: > > - put soc spefific axi filter events to drvdata according > > to franks suggestions. > > - adjust pmcfg axi_id and axi_mask config > > Changes in v3: > > - no changes > > Changes in v4: > > - only contain imx95 parts > > Changes in v5: > > - improve imx95_ddr_perf_monitor_config() > > - use write_relaxed to pair read_relaxed > > Changes in v6: > > - no changes > > --- > > drivers/perf/fsl_imx9_ddr_perf.c | 93 ++++++++++++++++++++++++++++++-- > > 1 file changed, 90 insertions(+), 3 deletions(-) > > > > diff --git a/drivers/perf/fsl_imx9_ddr_perf.c b/drivers/perf/fsl_imx9_ddr_perf.c > > index 52234b97d0cb..a91267e2f5d8 100644 > > --- a/drivers/perf/fsl_imx9_ddr_perf.c > > +++ b/drivers/perf/fsl_imx9_ddr_perf.c > > @@ -17,9 +17,19 @@ > > #define MX93_PMCFG1_RD_BT_FILT_EN BIT(29) > > #define MX93_PMCFG1_ID_MASK GENMASK(17, 0) > > > > +#define MX95_PMCFG1_WR_BEAT_FILT_EN BIT(31) > > +#define MX95_PMCFG1_RD_BEAT_FILT_EN BIT(30) > > + > > #define PMCFG2 0x04 > > #define MX93_PMCFG2_ID GENMASK(17, 0) > > > > +#define PMCFG3 0x08 > > +#define PMCFG4 0x0C > > +#define PMCFG5 0x10 > > +#define PMCFG6 0x14 > > +#define MX95_PMCFG_ID_MASK GENMASK(9, 0) > > +#define MX95_PMCFG_ID GENMASK(25, 16) > > + > > /* Global control register affects all counters and takes priority over local control registers */ > > #define PMGC0 0x40 > > /* Global control register bits */ > > @@ -77,13 +87,23 @@ static const struct imx_ddr_devtype_data imx93_devtype_data = { > > .identifier = "imx93", > > }; > > > > +static const struct imx_ddr_devtype_data imx95_devtype_data = { > > + .identifier = "imx95", > > +}; > > + > > static inline bool is_imx93(struct ddr_pmu *pmu) > > { > > return pmu->devtype_data == &imx93_devtype_data; > > } > > > > +static inline bool is_imx95(struct ddr_pmu *pmu) > > +{ > > + return pmu->devtype_data == &imx95_devtype_data; > > +} > > + > > static const struct of_device_id imx_ddr_pmu_dt_ids[] = { > > - {.compatible = "fsl,imx93-ddr-pmu", .data = &imx93_devtype_data}, > > + { .compatible = "fsl,imx93-ddr-pmu", .data = &imx93_devtype_data }, > > + { .compatible = "fsl,imx95-ddr-pmu", .data = &imx95_devtype_data }, > > { /* sentinel */ } > > }; > > MODULE_DEVICE_TABLE(of, imx_ddr_pmu_dt_ids); > > @@ -192,6 +212,7 @@ static struct attribute *ddr_perf_events_attrs[] = { > > IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_wiq_7, ID(2, 71)), > > IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_empty, ID(2, 72)), > > IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pm_rd_trans_filt, ID(2, 73)), /* imx93 specific*/ > > + IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pm_wr_beat_filt, ID(2, 73)), /* imx95 specific*/ > > > > /* counter3 specific events */ > > IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_collision_0, ID(3, 64)), > > @@ -204,6 +225,7 @@ static struct attribute *ddr_perf_events_attrs[] = { > > IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_collision_7, ID(3, 71)), > > IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_full, ID(3, 72)), > > IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pm_wr_trans_filt, ID(3, 73)), /* imx93 specific*/ > > + IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pm_rd_beat_filt2, ID(3, 73)), /* imx95 specific*/ > > > > /* counter4 specific events */ > > IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_open_0, ID(4, 64)), > > @@ -216,6 +238,7 @@ static struct attribute *ddr_perf_events_attrs[] = { > > IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_open_7, ID(4, 71)), > > IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_ld_rdq2_rmw, ID(4, 72)), > > IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pm_rd_beat_filt, ID(4, 73)), /* imx93 specific*/ > > + IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pm_rd_beat_filt1, ID(4, 73)), /* imx95 specific*/ > > > > /* counter5 specific events */ > > IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_valid_start_0, ID(5, 64)), > > @@ -227,6 +250,7 @@ static struct attribute *ddr_perf_events_attrs[] = { > > IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_valid_start_6, ID(5, 70)), > > IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_valid_start_7, ID(5, 71)), > > IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_ld_rdq1, ID(5, 72)), > > + IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pm_rd_beat_filt0, ID(5, 73)), /* imx95 specific*/ > > > > /* counter6 specific events */ > > IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_valid_end_0, ID(6, 64)), > > @@ -263,6 +287,13 @@ ddr_perf_events_attrs_is_visible(struct kobject *kobj, > > !is_imx93(ddr_pmu)) > > return 0; > > > > + if ((!strcmp(attr->name, "eddrtq_pm_wr_beat_filt") || > > + !strcmp(attr->name, "eddrtq_pm_rd_beat_filt2") || > > + !strcmp(attr->name, "eddrtq_pm_rd_beat_filt1") || > > + !strcmp(attr->name, "eddrtq_pm_rd_beat_filt0")) && > > + !is_imx95(ddr_pmu)) > > + return 0; > > + > > return attr->mode; > > } > > > > @@ -434,6 +465,57 @@ static void imx93_ddr_perf_monitor_config(struct ddr_pmu *pmu, int event, > > writel_relaxed(pmcfg2, pmu->base + PMCFG2); > > } > > > > +static void imx95_ddr_perf_monitor_config(struct ddr_pmu *pmu, int event, > > + int counter, int axi_id, int axi_mask) > > +{ > > + u32 pmcfg1, pmcfg, offset = 0; > > + > > + pmcfg1 = readl_relaxed(pmu->base + PMCFG1); > > + > > + if (event == 73) { > > + switch (counter) { > > + case 2: > > + pmcfg1 |= MX95_PMCFG1_WR_BEAT_FILT_EN; > > + offset = PMCFG3; > > + break; > > + case 3: > > + pmcfg1 |= MX95_PMCFG1_RD_BEAT_FILT_EN; > > + offset = PMCFG4; > > + break; > > + case 4: > > + pmcfg1 |= MX95_PMCFG1_RD_BEAT_FILT_EN; > > + offset = PMCFG5; > > + break; > > + case 5: > > + pmcfg1 |= MX95_PMCFG1_RD_BEAT_FILT_EN; > > + offset = PMCFG6; > > + break; > > + } > > + } else { > > + switch (counter) { > > + case 2: > > + pmcfg1 &= ~MX95_PMCFG1_WR_BEAT_FILT_EN; > > + break; > > + case 3: > > + case 4: > > + case 5: > > + pmcfg1 &= ~MX95_PMCFG1_RD_BEAT_FILT_EN; > > + break; > > + } > > + } > > Look like only if event = 73, FILTER need be set. > > How about > > pmcfg1 &= ~(MX95_PMCFG1_WR_BEAT_FILT_EN | MX95_PMCFG1_RD_BEAT_FILT_EN); > if (event == 73) > switch() > ... > > So you need "else" branch. Forget this one. My code have problem. Frank > > > > + > > + writel_relaxed(pmcfg1, pmu->base + PMCFG1); > > + > > + if (offset) { > > + pmcfg = readl_relaxed(pmu->base + offset); > > + pmcfg &= ~(FIELD_PREP(MX95_PMCFG_ID_MASK, 0x3FF) | > > + FIELD_PREP(MX95_PMCFG_ID, 0x3FF)); > > + pmcfg |= (FIELD_PREP(MX95_PMCFG_ID_MASK, axi_mask) | > > + FIELD_PREP(MX95_PMCFG_ID, axi_id)); > > + writel_relaxed(pmcfg, pmu->base + offset); > > + } > > +} > > + > > static void ddr_perf_event_update(struct perf_event *event) > > { > > struct ddr_pmu *pmu = to_ddr_pmu(event->pmu); > > @@ -543,8 +625,13 @@ static int ddr_perf_event_add(struct perf_event *event, int flags) > > hwc->idx = counter; > > hwc->state |= PERF_HES_STOPPED; > > > > - /* read trans, write trans, read beat */ > > - imx93_ddr_perf_monitor_config(pmu, event_id, counter, cfg1, cfg2); > > + if (is_imx93(pmu)) > > + /* read trans, write trans, read beat */ > > + imx93_ddr_perf_monitor_config(pmu, event_id, counter, cfg1, cfg2); > > + > > + if (is_imx95(pmu)) > > + /* write beat, read beat2, read beat1, read beat */ > > + imx95_ddr_perf_monitor_config(pmu, event_id, counter, cfg1, cfg2); > > > > if (flags & PERF_EF_START) > > ddr_perf_event_start(event, flags); > > -- > > 2.34.1 > >