All of lore.kernel.org
 help / color / mirror / Atom feed
From: Riana Tauro <riana.tauro@intel.com>
To: "Mallesh, Koujalagi" <mallesh.koujalagi@intel.com>
Cc: <anshuman.gupta@intel.com>, <rodrigo.vivi@intel.com>,
	<aravind.iddamsetty@linux.intel.com>, <badal.nilawar@intel.com>,
	<raag.jadav@intel.com>, <ravi.kishore.koppuravuri@intel.com>,
	<intel-xe@lists.freedesktop.org>
Subject: Re: [PATCH v2 09/11] drm/xe/xe_ras: Add structures for SoC Internal errors
Date: Wed, 11 Mar 2026 20:21:49 +0530	[thread overview]
Message-ID: <bb0159e9-18d2-4991-965b-89dea538384a@intel.com> (raw)
In-Reply-To: <4c4e9f47-c04a-4426-91ed-b415532d9dde@intel.com>



On 3/10/2026 6:32 PM, Mallesh, Koujalagi wrote:
> 
> On 02-03-2026 03:52 pm, Riana Tauro wrote:
>> Add response structures for SoC Internal errors.
>>
>> Signed-off-by: Riana Tauro <riana.tauro@intel.com>
>> ---
>>   drivers/gpu/drm/xe/xe_ras_types.h | 134 ++++++++++++++++++++++++++++++
>>   1 file changed, 134 insertions(+)
>>
>> diff --git a/drivers/gpu/drm/xe/xe_ras_types.h b/drivers/gpu/drm/xe/ 
>> xe_ras_types.h
>> index 221d07efd84c..466db9f47127 100644
>> --- a/drivers/gpu/drm/xe/xe_ras_types.h
>> +++ b/drivers/gpu/drm/xe/xe_ras_types.h
>> @@ -145,4 +145,138 @@ struct xe_ras_compute_error {
>>       u32 spare_log3;
>>   } __packed;
> Add hardware component glossary to more understanding.

Sorry didn't get this.

>> +/**
>> + * struct xe_ras_soc_error_source - Source of SOC error
>> + */
>> +struct xe_ras_soc_error_source {
>> +    /** @csc: CSC error */
>> +    u32 csc:1;
>> +    /** @soc: SOC error */
>> +    u32 soc:1;
>> +    /** @reserved: Reserved for future use */
>> +    u32 reserved:30;
>> +} __packed;
>> +
>> +/**
>> + * struct xe_ras_soc_error - SOC error details
>> + */
>> +struct xe_ras_soc_error {
>> +    /** @error_source: Error Source */
>> +    struct xe_ras_soc_error_source error_source;
>> +    /** @additional_details: Additional details */
>> +    u32 additional_details[15];
> Use Macro

This is remaining part of existing macro

+#define XE_RAS_MAX_ERROR_DETAILS	16

This is not used across files and adding a macro
for every array creates unnecessary defines for a single
file. If we explicitly change or use this array
we can add it.

>> +} __packed;
>> +
>> +/**
>> + * struct xe_ras_csc_error - CSC error details
>> + */
>> +struct xe_ras_csc_error {
>> +    /** @hec_uncorr_err_status: CSC error */
>> +    u32 hec_uncorr_err_status;
>> +    /** @hec_uncorr_fw_err_dw0: CSC f/w error */
>> +    u32 hec_uncorr_fw_err_dw0;
>> +} __packed;
>> +
>> +/**
>> + * struct xe_ras_ieh_error - SoC IEH error details
>> + */
>> +struct xe_ras_ieh_error {
>> +    /** @ieh_instance: IEH instance */
>> +    u32 ieh_instance:2;
>> +    /** @reserved: Reserved for future use */
>> +    u32 reserved:30;
>> +    union {
>> +        /** @global_error_status: Global error status */
>> +        u32 global_error_status;
>> +        /** @error_sources_ieh0: Error sources for IEH0 */
>> +        struct {
>> +            /** @psf0_psf1_npk: PSF0, PSF1, NPK */
>> +            u32 psf0_psf1_npk:1;
>> +            /** @punit: PUNIT */
>> +            u32 punit:1;
>> +            /** @reserved_2: Reserved */
>> +            u32 reserved_2:1;
>> +            /** @oobmsm: OOBMSM */
>> +            u32 oobmsm:1;
>> +            /** @i2c: I2C */
>> +            u32 i2c:1;
>> +            /** @pciess_gpma: PCIESS GPMA */
>> +            u32 pciess_gpma:1;
>> +            /** @lpioss_pma: LPIOSS PMA */
>> +            u32 lpioss_pma:1;
>> +            /** @fabss0_pma: FabSS0 PMA */
>> +            u32 fabss0_pma:1;
>> +            /** @fabss1_pma: FabSS1 PMA */
>> +            u32 fabss1_pma:1;
>> +            /** @reserved_9: Reserved */
>> +            u32 reserved_9:1;
>> +            /** @reserved_10: Reserved */
>> +            u32 reserved_10:1;
>> +            /** @reserved_11: Reserved */
>> +            u32 reserved_11:1;
>> +            /** @reserved_12: Reserved */
>> +            u32 reserved_12:1;
>> +            /** @reserved_13: Reserved */
>> +            u32 reserved_13:1;
>> +            /** @memss_ieh1: MEMSS -> IEH1 */
>> +            u32 memss_ieh1:1;
>> +            /** @memss_ieh2: MEMSS -> IEH2 */
>> +            u32 memss_ieh2:1;
>> +            /** @saf0_mhb0: SAF0 MHB0 */
>> +            u32 saf0_mhb0:1;
>> +            /** @saf0_mhb1: SAF0 MHB1 */
>> +            u32 saf0_mhb1:1;
>> +             /** @saf0_mhb2: SAF0 MHB2 */
> Please remove space

Thanks. Will remove it.

>> +            u32 saf0_mhb2:1;
>> +            /** @saf0_mhb3: SAF0 MHB3 */
>> +            u32 saf0_mhb3:1;
>> +            /** @saf0_mhb4: SAF0 MHB4 */
>> +            u32 saf0_mhb4:1;
>> +            /** @saf0_mhb5: SAF0 MHB5 */
>> +            u32 saf0_mhb5:1;
>> +            /** @saf0_mhb6: SAF0 MHB6 */
>> +            u32 saf0_mhb6:1;
>> +            /** @saf0_mhb7: SAF0 MHB7 */
>> +            u32 saf0_mhb7:1;
>> +            /** @saf1_mhb0: SAF1 MHB0 */
>> +            u32 saf1_mhb0:1;
>> +            /** @saf1_mhb1: SAF1 MHB1 */
>> +            u32 saf1_mhb1:1;
>> +            /** @saf1_mhb2: SAF1 MHB2 */
>> +            u32 saf1_mhb2:1;
>> +            /** @saf1_mhb3: SAF1 MHB3 */
>> +            u32 saf1_mhb3:1;
>> +            /** @saf1_mhb4: SAF1 MHB4 */
>> +            u32 saf1_mhb4:1;
>> +            /** @saf1_mhb5: SAF1 MHB5 */
>> +            u32 saf1_mhb5:1;
>> +            /** @saf1_mhb6: SAF1 MHB6 */
>> +            u32 saf1_mhb6:1;
>> +            /** @saf1_mhb7: SAF1 MHB7 */
>> +            u32 saf1_mhb7:1;
>> +        } error_sources_ieh0;
>> +    };
>> +
>> +    /** @lerr_status_ieh0: Local error status of IEH0 */
>> +    struct {
>> +        /** @reserved_0: Reserved for future use */
>> +        u32 reserved_0:1;
>> +        /** @psf0: PSF0 */
>> +        u32 psf0:1;
>> +        /** @psf1: PSF1 */
>> +        u32 psf1:1;
>> +        /** @reserved_26: Reserved */
>> +        u32 reserved_26:26;
> Reserved bit 3_28 right?, need to change name

Will just rename it to reserved 0,1,2 instead of bits

>> +        /** @npk: NPK */
>> +        u32 npk:1;
>> +        /** @reserved_30: Reserved */
>> +        u32 reserved_30:2;
> Reserved bit 30_31 right?
>> +    } lerr_status_ieh0;
>> +
>> +    /** @gerr_mask: Global error mask */
>> +    u32 gerr_mask;
>> +    /** @additional_info: Additional information */
>> +    u32 additional_info[10];
> 
> ditto above

Replied above

Thanks
Riana

> 
> Thanks
> 
> -/Mallesh
> 
>> +} __packed;
>> +
>>   #endif


  reply	other threads:[~2026-03-11 14:52 UTC|newest]

Thread overview: 43+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2026-03-02 10:21 [PATCH v2 00/11] Introduce Xe Uncorrectable Error Handling Riana Tauro
2026-03-02 10:21 ` [PATCH v2 01/11] drm/xe/xe_sysctrl: Add System controller patch Riana Tauro
2026-03-02 10:21 ` [PATCH v2 02/11] drm/xe/xe_survivability: Decouple survivability info from boot survivability Riana Tauro
2026-03-02 17:00   ` Raag Jadav
2026-03-03  8:18     ` Mallesh, Koujalagi
2026-03-30 12:56       ` Tauro, Riana
2026-03-30 13:00     ` Tauro, Riana
2026-03-02 10:21 ` [PATCH v2 03/11] drm/xe/xe_pci_error: Implement PCI error recovery callbacks Riana Tauro
2026-03-02 17:37   ` Raag Jadav
2026-03-03  5:09     ` Riana Tauro
2026-03-04 10:38   ` Mallesh, Koujalagi
2026-03-31  5:18     ` Tauro, Riana
2026-03-02 10:21 ` [PATCH v2 04/11] drm/xe/xe_pci_error: Group all devres to release them on PCIe slot reset Riana Tauro
2026-03-02 10:22 ` [PATCH v2 05/11] drm/xe: Skip device access during PCI error recovery Riana Tauro
2026-03-04 10:59   ` Mallesh, Koujalagi
2026-03-02 10:22 ` [PATCH v2 06/11] drm/xe/xe_ras: Initialize Uncorrectable AER Registers Riana Tauro
2026-03-02 10:22 ` [PATCH v2 07/11] drm/xe/xe_ras: Add structures and commands for Uncorrectable Core Compute Errors Riana Tauro
2026-03-04 16:32   ` Raag Jadav
2026-03-31 16:14     ` Tauro, Riana
2026-04-01  6:25       ` Raag Jadav
2026-04-01  6:39         ` Tauro, Riana
2026-03-02 10:22 ` [PATCH v2 08/11] drm/xe/xe_ras: Add support for Uncorrectable Core-Compute errors Riana Tauro
2026-03-04 16:52   ` Raag Jadav
2026-03-06 18:37     ` Raag Jadav
2026-03-31 16:24     ` Tauro, Riana
2026-04-01  6:34       ` Raag Jadav
2026-04-01  6:47         ` Tauro, Riana
2026-03-06  3:50   ` [v2,08/11] " Purkait, Soham
2026-03-31 16:16     ` Tauro, Riana
2026-03-02 10:22 ` [PATCH v2 09/11] drm/xe/xe_ras: Add structures for SoC Internal errors Riana Tauro
2026-03-10 13:02   ` Mallesh, Koujalagi
2026-03-11 14:51     ` Riana Tauro [this message]
2026-03-02 10:22 ` [PATCH v2 10/11] drm/xe/xe_ras: Handle Uncorrectable " Riana Tauro
2026-03-10 13:29   ` Mallesh, Koujalagi
2026-03-11 14:55     ` Riana Tauro
2026-03-02 10:22 ` [PATCH v2 11/11] drm/xe/xe_pci_error: Process errors in mmio_enabled Riana Tauro
2026-03-11  7:10   ` Mallesh, Koujalagi
2026-03-11 14:39     ` Riana Tauro
2026-03-12  8:08       ` Mallesh, Koujalagi
2026-03-02 16:10 ` ✗ CI.checkpatch: warning for Introduce Xe Uncorrectable Error Handling (rev2) Patchwork
2026-03-02 16:11 ` ✓ CI.KUnit: success " Patchwork
2026-03-02 16:48 ` ✓ Xe.CI.BAT: " Patchwork
2026-03-02 18:29 ` ✗ Xe.CI.FULL: failure " Patchwork

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=bb0159e9-18d2-4991-965b-89dea538384a@intel.com \
    --to=riana.tauro@intel.com \
    --cc=anshuman.gupta@intel.com \
    --cc=aravind.iddamsetty@linux.intel.com \
    --cc=badal.nilawar@intel.com \
    --cc=intel-xe@lists.freedesktop.org \
    --cc=mallesh.koujalagi@intel.com \
    --cc=raag.jadav@intel.com \
    --cc=ravi.kishore.koppuravuri@intel.com \
    --cc=rodrigo.vivi@intel.com \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.