On Mon, Feb 02, 2026 at 06:43:08PM -0300, Gustavo Sousa wrote:
> From: Shekhar Chauhan <[email protected]>
> 
> Add the initial set of workarounds for Xe3p_LPG graphics version 35.10.
> 
> Signed-off-by: Shekhar Chauhan <[email protected]>
> Co-developed-by: Nitin Gote <[email protected]>
> Signed-off-by: Nitin Gote <[email protected]>
> Co-developed-by: Tangudu Tilak Tirumalesh <[email protected]>
> Signed-off-by: Tangudu Tilak Tirumalesh <[email protected]>
> Co-developed-by: Mallesh Koujalagi <[email protected]>
> Signed-off-by: Mallesh Koujalagi <[email protected]>
> Co-developed-by: Gustavo Sousa <[email protected]>
> Signed-off-by: Gustavo Sousa <[email protected]>
> ---
>  drivers/gpu/drm/xe/regs/xe_gt_regs.h  | 19 ++++++++++++++
>  drivers/gpu/drm/xe/xe_reg_whitelist.c |  8 ++++++
>  drivers/gpu/drm/xe/xe_wa.c            | 48 
> +++++++++++++++++++++++++++++++++++
>  3 files changed, 75 insertions(+)
> 
> diff --git a/drivers/gpu/drm/xe/regs/xe_gt_regs.h 
> b/drivers/gpu/drm/xe/regs/xe_gt_regs.h
> index 24fc64fc832e..b5a7cc45f13d 100644
> --- a/drivers/gpu/drm/xe/regs/xe_gt_regs.h
> +++ b/drivers/gpu/drm/xe/regs/xe_gt_regs.h
> @@ -100,6 +100,9 @@
>  #define VE1_AUX_INV                          XE_REG(0x42b8)
>  #define   AUX_INV                            REG_BIT(0)
>  
> +#define GAMSTLB_CTRL2                                XE_REG_MCR(0x4788)
> +#define   STLB_SINGLE_BANK_MODE                      REG_BIT(11)
> +
>  #define XE2_LMEM_CFG                         XE_REG(0x48b0)
>  
>  #define XE2_GAMWALK_CTRL                     0x47e4
> @@ -107,12 +110,18 @@
>  #define XE2_GAMWALK_CTRL_3D                  XE_REG_MCR(XE2_GAMWALK_CTRL)
>  #define   EN_CMP_1WCOH_GW                    REG_BIT(14)
>  
> +#define MMIOATSREQLIMIT_GAM_WALK_3D             XE_REG_MCR(0x47f8)
> +#define   DIS_ATS_WRONLY_PG                     REG_BIT(18)
> +
>  #define XEHP_FLAT_CCS_BASE_ADDR                      XE_REG_MCR(0x4910)
>  #define XEHP_FLAT_CCS_PTR                    REG_GENMASK(31, 8)
>  
>  #define WM_CHICKEN3                          XE_REG_MCR(0x5588, 
> XE_REG_OPTION_MASKED)
>  #define   HIZ_PLANE_COMPRESSION_DIS          REG_BIT(10)
>  
> +#define TBIMR_MODE                           XE_REG_MCR(0x6200, 
> XE_REG_OPTION_MASKED)
> +#define   RXBAR_NO_UAV_DEC_SYNC                      REG_BIT(12)
> +
>  #define CHICKEN_RASTER_1                     XE_REG_MCR(0x6204, 
> XE_REG_OPTION_MASKED)
>  #define   DIS_SF_ROUND_NEAREST_EVEN          REG_BIT(8)
>  #define   DIS_CLIP_NEGATIVE_BOUNDING_BOX     REG_BIT(6)
> @@ -210,6 +219,9 @@
>  
>  #define GSCPSMI_BASE                         XE_REG(0x880c)
>  
> +#define CCCHKNREG2                           XE_REG_MCR(0x881c)
> +#define  LOCALITYDIS                         REG_BIT(7)

Nitpick: the formatting is slightly off here (the field name should be
spaced over one more column).

> +
>  #define CCCHKNREG1                           XE_REG_MCR(0x8828)
>  #define   L3CMPCTRL                          REG_BIT(23)
>  #define   ENCOMPPERFFIX                              REG_BIT(18)
> @@ -420,6 +432,8 @@
>  #define   LSN_DIM_Z_WGT(value)                       
> REG_FIELD_PREP(LSN_DIM_Z_WGT_MASK, value)
>  
>  #define L3SQCREG2                            XE_REG_MCR(0xb104)
> +#define   L3_SQ_DISABLE_COAMA_2WAY_COH               REG_BIT(30)
> +#define   L3_SQ_DISABLE_COAMA                        REG_BIT(22)
>  #define   COMPMEMRD256BOVRFETCHEN            REG_BIT(20)
>  
>  #define L3SQCREG3                            XE_REG_MCR(0xb108)
> @@ -550,11 +564,16 @@
>  #define   UGM_FRAGMENT_THRESHOLD_TO_3                REG_BIT(58 - 32)
>  #define   DIS_CHAIN_2XSIMD8                  REG_BIT(55 - 32)
>  #define   XE2_ALLOC_DPA_STARVE_FIX_DIS               REG_BIT(47 - 32)
> +#define   SAMPLER_LD_LSC_DISABLE                REG_BIT(45 - 32)
>  #define   ENABLE_SMP_LD_RENDER_SURFACE_CONTROL       REG_BIT(44 - 32)
>  #define   FORCE_SLM_FENCE_SCOPE_TO_TILE              REG_BIT(42 - 32)
>  #define   FORCE_UGM_FENCE_SCOPE_TO_TILE              REG_BIT(41 - 32)
>  #define   MAXREQS_PER_BANK                   REG_GENMASK(39 - 32, 37 - 32)
>  #define   DISABLE_128B_EVICTION_COMMAND_UDW  REG_BIT(36 - 32)
> +#define   LSCFE_SAME_ADDRESS_ATOMICS_COALESCING_DISABLE      REG_BIT(35 - 32)
> +
> +#define ROW_CHICKEN5                         XE_REG_MCR(0xe7f0)
> +#define   CPSS_AWARE_DIS                     REG_BIT(3)
>  
>  #define SARB_CHICKEN1                                XE_REG_MCR(0xe90c)
>  #define   COMP_CKN_IN                                REG_GENMASK(30, 29)
> diff --git a/drivers/gpu/drm/xe/xe_reg_whitelist.c 
> b/drivers/gpu/drm/xe/xe_reg_whitelist.c
> index 1d36c09681aa..9c513778d370 100644
> --- a/drivers/gpu/drm/xe/xe_reg_whitelist.c
> +++ b/drivers/gpu/drm/xe/xe_reg_whitelist.c
> @@ -81,6 +81,14 @@ static const struct xe_rtp_entry_sr register_whitelist[] = 
> {
>                        WHITELIST(VFLSKPD,
>                                  RING_FORCE_TO_NONPRIV_ACCESS_RW))
>       },
> +     { XE_RTP_NAME("14024997852"),
> +       XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0),
> +                    ENGINE_CLASS(RENDER)),
> +       XE_RTP_ACTIONS(WHITELIST(FF_MODE,
> +                                RING_FORCE_TO_NONPRIV_ACCESS_RW),
> +                      WHITELIST(VFLSKPD,
> +                                RING_FORCE_TO_NONPRIV_ACCESS_RW))
> +     },
>  
>  #define WHITELIST_OA_MMIO_TRG(trg, status, head) \
>       WHITELIST(trg, RING_FORCE_TO_NONPRIV_ACCESS_RW), \
> diff --git a/drivers/gpu/drm/xe/xe_wa.c b/drivers/gpu/drm/xe/xe_wa.c
> index a991ee2b8781..68a494743b34 100644
> --- a/drivers/gpu/drm/xe/xe_wa.c
> +++ b/drivers/gpu/drm/xe/xe_wa.c
> @@ -306,6 +306,31 @@ static const struct xe_rtp_entry_sr gt_was[] = {
>         XE_RTP_RULES(GRAPHICS_VERSION_RANGE(3000, 3005)),
>         XE_RTP_ACTIONS(SET(GUC_INTR_CHICKEN, DISABLE_SIGNALING_ENGINES))
>       },
> +
> +     /* Xe3P_LPG */
> +
> +     { XE_RTP_NAME("14025160223"),
> +       XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0)),
> +       XE_RTP_ACTIONS(SET(MMIOATSREQLIMIT_GAM_WALK_3D,
> +                          DIS_ATS_WRONLY_PG))
> +     },
> +     { XE_RTP_NAME("16028780921"),
> +       XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0)),
> +       XE_RTP_ACTIONS(SET(CCCHKNREG2, LOCALITYDIS))
> +     },
> +     { XE_RTP_NAME("14026144927"),
> +       XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0)),
> +       XE_RTP_ACTIONS(SET(L3SQCREG2, L3_SQ_DISABLE_COAMA_2WAY_COH |
> +                          L3_SQ_DISABLE_COAMA))
> +     },
> +     { XE_RTP_NAME("14025635424"),
> +       XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0)),
> +       XE_RTP_ACTIONS(SET(GAMSTLB_CTRL2, STLB_SINGLE_BANK_MODE))
> +     },
> +     { XE_RTP_NAME("16028005424"),
> +       XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0)),
> +       XE_RTP_ACTIONS(SET(GUC_INTR_CHICKEN, DISABLE_SIGNALING_ENGINES))
> +     },
>  };
>  
>  static const struct xe_rtp_entry_sr engine_was[] = {
> @@ -680,6 +705,24 @@ static const struct xe_rtp_entry_sr engine_was[] = {
>                      FUNC(xe_rtp_match_gt_has_discontiguous_dss_groups)),
>         XE_RTP_ACTIONS(SET(TDL_CHICKEN, EUSTALL_PERF_SAMPLING_DISABLE))
>       },
> +
> +     /* Xe3p_LPG*/
> +
> +     { XE_RTP_NAME("22021149932"),
> +       XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0),
> +                    FUNC(xe_rtp_match_first_render_or_compute)),
> +       XE_RTP_ACTIONS(SET(LSC_CHICKEN_BIT_0_UDW, SAMPLER_LD_LSC_DISABLE))
> +     },
> +     { XE_RTP_NAME("14025676848"),
> +       XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0),
> +                    FUNC(xe_rtp_match_first_render_or_compute)),
> +       XE_RTP_ACTIONS(SET(LSC_CHICKEN_BIT_0_UDW, 
> LSCFE_SAME_ADDRESS_ATOMICS_COALESCING_DISABLE))
> +     },
> +     { XE_RTP_NAME("16028951944"),
> +       XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0),
> +                    FUNC(xe_rtp_match_first_render_or_compute)),
> +       XE_RTP_ACTIONS(SET(ROW_CHICKEN5, CPSS_AWARE_DIS))
> +     },
>  };
>  
>  static const struct xe_rtp_entry_sr lrc_was[] = {
> @@ -879,6 +922,11 @@ static const struct xe_rtp_entry_sr lrc_was[] = {
>                      ENGINE_CLASS(RENDER)),
>         XE_RTP_ACTIONS(SET(CHICKEN_RASTER_1, DIS_CLIP_NEGATIVE_BOUNDING_BOX))
>       },
> +     { XE_RTP_NAME("14025780377"),
> +       XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0),
> +                    ENGINE_CLASS(RENDER)),
> +       XE_RTP_ACTIONS(SET(TBIMR_MODE, RXBAR_NO_UAV_DEC_SYNC))

I'm not sure if this one is actually needed.  Originally the workaround
ticket just said "program 0x6200[12]" but it's since been updated to an
"if (por) no workaround needed, else if (non-POR thing) program the
register and add a stalling flush."  There are also comments in the
ticket itself that indicate it shouldn't actually be relevant to this
specific platform due to other characteristics of the platform; it's
just something that they'll need to fix or workaround in the future so
that it doesn't impact future derivative platforms.


Matt

> +     },
>  };
>  
>  static __maybe_unused const struct xe_rtp_entry oob_was[] = {
> 
> -- 
> 2.52.0
> 

-- 
Matt Roper
Graphics Software Engineer
Linux GPU Platform Enablement
Intel Corporation

Reply via email to