* [PATCH] perf/cxlpmu: Support Channel/Rank/Bank filter
@ 2026-06-11 1:04 Davidlohr Bueso
2026-06-11 1:14 ` sashiko-bot
0 siblings, 1 reply; 2+ messages in thread
From: Davidlohr Bueso @ 2026-06-11 1:04 UTC (permalink / raw)
To: jic23, will, mark.rutland
Cc: linux-cxl, linux-perf-users, Harshal Thakkar, Davidlohr Bueso
From: Harshal Thakkar <harshal.t@samsung.com>
Implement CRB filtering per CXL 4.0 8.2.7.2.2, and extend the
current filtering support beyond HDM. These filters are only for
DDR Interface events.
Placing the 32-bit CRB value at config2:32-63 leaves the
exisitng HDM value at config2:0-15 untouched and avoids needing
a new config3.
Signed-off-by: Harshal Thakkar <harshal.t@samsung.com>
Signed-off-by: Davidlohr Bueso <dave@stgolabs.net>
---
drivers/perf/cxl_pmu.c | 45 ++++++++++++++++++++++++++++++++++++++++--
1 file changed, 43 insertions(+), 2 deletions(-)
diff --git a/drivers/perf/cxl_pmu.c b/drivers/perf/cxl_pmu.c
index 68a54d97d2a8..b709b2e6c0d9 100644
--- a/drivers/perf/cxl_pmu.c
+++ b/drivers/perf/cxl_pmu.c
@@ -106,6 +106,7 @@ struct cxl_pmu_info {
int on_cpu;
struct hlist_node node;
bool filter_hdm;
+ bool filter_chan_rank_bank;
int irq;
};
@@ -142,6 +143,8 @@ static int cxl_pmu_parse_caps(struct device *dev, struct cxl_pmu_info *info)
info->num_event_capabilities = FIELD_GET(CXL_PMU_CAP_NUM_EVN_CAP_REG_SUP_MSK, val) + 1;
info->filter_hdm = FIELD_GET(CXL_PMU_CAP_FILTERS_SUP_MSK, val) & CXL_PMU_FILTER_HDM;
+ info->filter_chan_rank_bank = FIELD_GET(CXL_PMU_CAP_FILTERS_SUP_MSK, val) &
+ CXL_PMU_FILTER_CHAN_RANK_BANK;
if (FIELD_GET(CXL_PMU_CAP_INT, val))
info->irq = FIELD_GET(CXL_PMU_CAP_MSI_N_MSK, val);
else
@@ -225,6 +228,8 @@ enum {
cxl_pmu_edge_attr,
cxl_pmu_hdm_filter_en_attr,
cxl_pmu_hdm_attr,
+ cxl_pmu_crb_filter_en_attr,
+ cxl_pmu_crb_attr,
};
static struct attribute *cxl_pmu_format_attr[] = {
@@ -236,6 +241,8 @@ static struct attribute *cxl_pmu_format_attr[] = {
[cxl_pmu_edge_attr] = CXL_PMU_FORMAT_ATTR(edge, "config1:17"),
[cxl_pmu_hdm_filter_en_attr] = CXL_PMU_FORMAT_ATTR(hdm_filter_en, "config1:18"),
[cxl_pmu_hdm_attr] = CXL_PMU_FORMAT_ATTR(hdm, "config2:0-15"),
+ [cxl_pmu_crb_filter_en_attr] = CXL_PMU_FORMAT_ATTR(crb_filter_en, "config1:19"),
+ [cxl_pmu_crb_attr] = CXL_PMU_FORMAT_ATTR(crb, "config2:32-63"),
NULL
};
@@ -246,7 +253,9 @@ static struct attribute *cxl_pmu_format_attr[] = {
#define CXL_PMU_ATTR_CONFIG1_INVERT_MSK BIT(16)
#define CXL_PMU_ATTR_CONFIG1_EDGE_MSK BIT(17)
#define CXL_PMU_ATTR_CONFIG1_FILTER_EN_MSK BIT(18)
+#define CXL_PMU_ATTR_CONFIG1_CRB_FILTER_EN_MSK BIT(19)
#define CXL_PMU_ATTR_CONFIG2_HDM_MSK GENMASK(15, 0)
+#define CXL_PMU_ATTR_CONFIG2_CRB_MSK GENMASK(63, 32)
static umode_t cxl_pmu_format_is_visible(struct kobject *kobj,
struct attribute *attr, int a)
@@ -263,6 +272,11 @@ static umode_t cxl_pmu_format_is_visible(struct kobject *kobj,
attr == cxl_pmu_format_attr[cxl_pmu_hdm_attr]))
return 0;
+ if (!info->filter_chan_rank_bank &&
+ (attr == cxl_pmu_format_attr[cxl_pmu_crb_filter_en_attr] ||
+ attr == cxl_pmu_format_attr[cxl_pmu_crb_attr]))
+ return 0;
+
return attr->mode;
}
@@ -319,6 +333,17 @@ static u16 cxl_pmu_config2_get_hdm_decoder(struct perf_event *event)
return FIELD_GET(CXL_PMU_ATTR_CONFIG2_HDM_MSK, event->attr.config2);
}
+static u16 cxl_pmu_config1_crb_filter_en(struct perf_event *event)
+{
+ return FIELD_GET(CXL_PMU_ATTR_CONFIG1_CRB_FILTER_EN_MSK,
+ event->attr.config1);
+}
+
+static u16 cxl_pmu_config2_get_crb(struct perf_event *event)
+{
+ return FIELD_GET(CXL_PMU_ATTR_CONFIG2_CRB_MSK, event->attr.config2);
+}
+
static ssize_t cxl_pmu_event_sysfs_show(struct device *dev,
struct device_attribute *attr, char *buf)
{
@@ -571,6 +596,14 @@ static int cxl_pmu_event_init(struct perf_event *event)
return -EOPNOTSUPP;
/* TODO: Validation of any filter */
+ if (cxl_pmu_config1_crb_filter_en(event)) {
+ if (!info->filter_chan_rank_bank)
+ return -EINVAL;
+ /* only valid for DDR Interface events */
+ if (cxl_pmu_config_get_gid(event) != CXL_PMU_GID_DDR)
+ return -EINVAL;
+ }
+
/*
* Verify that it is possible to count what was requested. Either must
* be a fixed counter that is a precise match or a configurable counter
@@ -627,8 +660,8 @@ static void cxl_pmu_event_start(struct perf_event *event, int flags)
hwc->state = 0;
/*
- * Currently only hdm filter control is implemented, this code will
- * want generalizing when more filters are added.
+ * Filter ID=0: HDM decoder filter
+ * Filter ID=1: Channel/Rank/Bank (CRB) filter
*/
if (info->filter_hdm) {
if (cxl_pmu_config1_hdm_filter_en(event))
@@ -638,6 +671,14 @@ static void cxl_pmu_event_start(struct perf_event *event, int flags)
writeq(cfg, base + CXL_PMU_FILTER_CFG_REG(hwc->idx, 0));
}
+ if (info->filter_chan_rank_bank) {
+ if (cxl_pmu_config1_crb_filter_en(event))
+ cfg = cxl_pmu_config2_get_crb(event);
+ else
+ cfg = GENMASK(31, 0); /* no filtering if 0xFFFF_FFFF */
+ writeq(cfg, base + CXL_PMU_FILTER_CFG_REG(hwc->idx, 1));
+ }
+
cfg = readq(base + CXL_PMU_COUNTER_CFG_REG(hwc->idx));
cfg |= FIELD_PREP(CXL_PMU_COUNTER_CFG_INT_ON_OVRFLW, 1);
cfg |= FIELD_PREP(CXL_PMU_COUNTER_CFG_FREEZE_ON_OVRFLW, 1);
--
2.39.5
^ permalink raw reply related [flat|nested] 2+ messages in thread
* Re: [PATCH] perf/cxlpmu: Support Channel/Rank/Bank filter
2026-06-11 1:04 [PATCH] perf/cxlpmu: Support Channel/Rank/Bank filter Davidlohr Bueso
@ 2026-06-11 1:14 ` sashiko-bot
0 siblings, 0 replies; 2+ messages in thread
From: sashiko-bot @ 2026-06-11 1:14 UTC (permalink / raw)
To: Davidlohr Bueso; +Cc: linux-cxl, linux-perf-users
Thank you for your contribution! Sashiko AI review found 3 potential issue(s) to consider:
- [High] The function `cxl_pmu_config2_get_crb()` returns `u16`, silently truncating the 32-bit CRB filter value.
- [High] Using `writeq()` to program the 32-bit CRB filter register causes unaligned MMIO access and clobbers adjacent registers.
- [Low] The mask `CXL_PMU_ATTR_CONFIG2_CRB_MSK` is defined using `GENMASK(63, 32)`, causing compilation errors and undefined behavior on 32-bit architectures.
--
commit a9330e1fbdf601456995f95b96ae724e328f12a5
Author: Harshal Thakkar <harshal.t@samsung.com>
perf/cxlpmu: Support Channel/Rank/Bank filter
Implement CRB filtering per CXL 4.0 8.2.7.2.2, and extend the current filtering
support beyond HDM. These filters are only for DDR Interface events.
> diff --git a/drivers/perf/cxl_pmu.c b/drivers/perf/cxl_pmu.c
> index 68a54d97d2a8a..b709b2e6c0d95 100644
> --- a/drivers/perf/cxl_pmu.c
> +++ b/drivers/perf/cxl_pmu.c
[ ... ]
> @@ -246,7 +253,9 @@ static struct attribute *cxl_pmu_format_attr[] = {
> #define CXL_PMU_ATTR_CONFIG1_INVERT_MSK BIT(16)
> #define CXL_PMU_ATTR_CONFIG1_EDGE_MSK BIT(17)
> #define CXL_PMU_ATTR_CONFIG1_FILTER_EN_MSK BIT(18)
> +#define CXL_PMU_ATTR_CONFIG1_CRB_FILTER_EN_MSK BIT(19)
> #define CXL_PMU_ATTR_CONFIG2_HDM_MSK GENMASK(15, 0)
> +#define CXL_PMU_ATTR_CONFIG2_CRB_MSK GENMASK(63, 32)
[Severity: Low]
Does this code cause compilation errors on 32-bit architectures?
GENMASK generates an unsigned long, which is 32 bits wide on 32-bit
architectures. Shifting by 32 or more results in undefined behavior and
triggers the macro's internal BUILD_BUG_ON_ZERO(h >= BITS_PER_LONG).
Should this use GENMASK_ULL(63, 32) for a 64-bit mask?
[ ... ]
> @@ -319,6 +333,17 @@ static u16 cxl_pmu_config2_get_hdm_decoder(struct perf_event *event)
> return FIELD_GET(CXL_PMU_ATTR_CONFIG2_HDM_MSK, event->attr.config2);
> }
>
> +static u16 cxl_pmu_config1_crb_filter_en(struct perf_event *event)
> +{
> + return FIELD_GET(CXL_PMU_ATTR_CONFIG1_CRB_FILTER_EN_MSK,
> + event->attr.config1);
> +}
> +
> +static u16 cxl_pmu_config2_get_crb(struct perf_event *event)
> +{
> + return FIELD_GET(CXL_PMU_ATTR_CONFIG2_CRB_MSK, event->attr.config2);
> +}
[Severity: High]
Does this function truncate the 32-bit CRB filter value?
The CRB filter mask config2:32-63 is 32 bits wide, but
cxl_pmu_config2_get_crb() returns u16. When the 32-bit value is extracted
using FIELD_GET(), the upper 16 bits are silently dropped.
Should the return type be changed to u32 to preserve the full filter value?
[ ... ]
> @@ -627,8 +660,8 @@ static void cxl_pmu_event_start(struct perf_event *event, int flags)
> hwc->state = 0;
>
> /*
> - * Currently only hdm filter control is implemented, this code will
> - * want generalizing when more filters are added.
> + * Filter ID=0: HDM decoder filter
> + * Filter ID=1: Channel/Rank/Bank (CRB) filter
> */
> if (info->filter_hdm) {
> if (cxl_pmu_config1_hdm_filter_en(event))
> @@ -638,6 +671,14 @@ static void cxl_pmu_event_start(struct perf_event *event, int flags)
> writeq(cfg, base + CXL_PMU_FILTER_CFG_REG(hwc->idx, 0));
> }
>
> + if (info->filter_chan_rank_bank) {
> + if (cxl_pmu_config1_crb_filter_en(event))
> + cfg = cxl_pmu_config2_get_crb(event);
> + else
> + cfg = GENMASK(31, 0); /* no filtering if 0xFFFF_FFFF */
> + writeq(cfg, base + CXL_PMU_FILTER_CFG_REG(hwc->idx, 1));
[Severity: High]
Can this writeq() trigger an unaligned MMIO access fault and clobber
adjacent registers?
The CXL PMU filter configuration registers are 32 bits wide with a 4-byte
stride:
0x400 + 4 * (f + n * 8)
For f=1, CXL_PMU_FILTER_CFG_REG() resolves to an unaligned offset like
0x404. Using a 64-bit writeq() on a 4-byte unaligned device memory
address triggers undefined behavior and hardware alignment faults, such as
a Synchronous External Abort on ARM64.
Additionally, writing 64 bits to a 32-bit register clobbers the adjacent
register (f=2).
Would writel() be safer here?
> + }
> +
> cfg = readq(base + CXL_PMU_COUNTER_CFG_REG(hwc->idx));
> cfg |= FIELD_PREP(CXL_PMU_COUNTER_CFG_INT_ON_OVRFLW, 1);
> cfg |= FIELD_PREP(CXL_PMU_COUNTER_CFG_FREEZE_ON_OVRFLW, 1);
--
Sashiko AI review · https://sashiko.dev/#/patchset/20260611010409.2776635-1-dave@stgolabs.net?part=1
^ permalink raw reply [flat|nested] 2+ messages in thread
end of thread, other threads:[~2026-06-11 1:14 UTC | newest]
Thread overview: 2+ messages (download: mbox.gz follow: Atom feed
-- links below jump to the message on this page --
2026-06-11 1:04 [PATCH] perf/cxlpmu: Support Channel/Rank/Bank filter Davidlohr Bueso
2026-06-11 1:14 ` sashiko-bot
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox