On Mon, Feb 02, 2026 at 06:43:08PM -0300, Gustavo Sousa wrote:
> From: Shekhar Chauhan <[email protected]>
>
> Add the initial set of workarounds for Xe3p_LPG graphics version 35.10.
>
> Signed-off-by: Shekhar Chauhan <[email protected]>
> Co-developed-by: Nitin Gote <[email protected]>
> Signed-off-by: Nitin Gote <[email protected]>
> Co-developed-by: Tangudu Tilak Tirumalesh <[email protected]>
> Signed-off-by: Tangudu Tilak Tirumalesh <[email protected]>
> Co-developed-by: Mallesh Koujalagi <[email protected]>
> Signed-off-by: Mallesh Koujalagi <[email protected]>
> Co-developed-by: Gustavo Sousa <[email protected]>
> Signed-off-by: Gustavo Sousa <[email protected]>
> ---
> drivers/gpu/drm/xe/regs/xe_gt_regs.h | 19 ++++++++++++++
> drivers/gpu/drm/xe/xe_reg_whitelist.c | 8 ++++++
> drivers/gpu/drm/xe/xe_wa.c | 48
> +++++++++++++++++++++++++++++++++++
> 3 files changed, 75 insertions(+)
>
> diff --git a/drivers/gpu/drm/xe/regs/xe_gt_regs.h
> b/drivers/gpu/drm/xe/regs/xe_gt_regs.h
> index 24fc64fc832e..b5a7cc45f13d 100644
> --- a/drivers/gpu/drm/xe/regs/xe_gt_regs.h
> +++ b/drivers/gpu/drm/xe/regs/xe_gt_regs.h
> @@ -100,6 +100,9 @@
> #define VE1_AUX_INV XE_REG(0x42b8)
> #define AUX_INV REG_BIT(0)
>
> +#define GAMSTLB_CTRL2 XE_REG_MCR(0x4788)
> +#define STLB_SINGLE_BANK_MODE REG_BIT(11)
> +
> #define XE2_LMEM_CFG XE_REG(0x48b0)
>
> #define XE2_GAMWALK_CTRL 0x47e4
> @@ -107,12 +110,18 @@
> #define XE2_GAMWALK_CTRL_3D XE_REG_MCR(XE2_GAMWALK_CTRL)
> #define EN_CMP_1WCOH_GW REG_BIT(14)
>
> +#define MMIOATSREQLIMIT_GAM_WALK_3D XE_REG_MCR(0x47f8)
> +#define DIS_ATS_WRONLY_PG REG_BIT(18)
> +
> #define XEHP_FLAT_CCS_BASE_ADDR XE_REG_MCR(0x4910)
> #define XEHP_FLAT_CCS_PTR REG_GENMASK(31, 8)
>
> #define WM_CHICKEN3 XE_REG_MCR(0x5588,
> XE_REG_OPTION_MASKED)
> #define HIZ_PLANE_COMPRESSION_DIS REG_BIT(10)
>
> +#define TBIMR_MODE XE_REG_MCR(0x6200,
> XE_REG_OPTION_MASKED)
> +#define RXBAR_NO_UAV_DEC_SYNC REG_BIT(12)
> +
> #define CHICKEN_RASTER_1 XE_REG_MCR(0x6204,
> XE_REG_OPTION_MASKED)
> #define DIS_SF_ROUND_NEAREST_EVEN REG_BIT(8)
> #define DIS_CLIP_NEGATIVE_BOUNDING_BOX REG_BIT(6)
> @@ -210,6 +219,9 @@
>
> #define GSCPSMI_BASE XE_REG(0x880c)
>
> +#define CCCHKNREG2 XE_REG_MCR(0x881c)
> +#define LOCALITYDIS REG_BIT(7)
Nitpick: the formatting is slightly off here (the field name should be
spaced over one more column).
> +
> #define CCCHKNREG1 XE_REG_MCR(0x8828)
> #define L3CMPCTRL REG_BIT(23)
> #define ENCOMPPERFFIX REG_BIT(18)
> @@ -420,6 +432,8 @@
> #define LSN_DIM_Z_WGT(value)
> REG_FIELD_PREP(LSN_DIM_Z_WGT_MASK, value)
>
> #define L3SQCREG2 XE_REG_MCR(0xb104)
> +#define L3_SQ_DISABLE_COAMA_2WAY_COH REG_BIT(30)
> +#define L3_SQ_DISABLE_COAMA REG_BIT(22)
> #define COMPMEMRD256BOVRFETCHEN REG_BIT(20)
>
> #define L3SQCREG3 XE_REG_MCR(0xb108)
> @@ -550,11 +564,16 @@
> #define UGM_FRAGMENT_THRESHOLD_TO_3 REG_BIT(58 - 32)
> #define DIS_CHAIN_2XSIMD8 REG_BIT(55 - 32)
> #define XE2_ALLOC_DPA_STARVE_FIX_DIS REG_BIT(47 - 32)
> +#define SAMPLER_LD_LSC_DISABLE REG_BIT(45 - 32)
> #define ENABLE_SMP_LD_RENDER_SURFACE_CONTROL REG_BIT(44 - 32)
> #define FORCE_SLM_FENCE_SCOPE_TO_TILE REG_BIT(42 - 32)
> #define FORCE_UGM_FENCE_SCOPE_TO_TILE REG_BIT(41 - 32)
> #define MAXREQS_PER_BANK REG_GENMASK(39 - 32, 37 - 32)
> #define DISABLE_128B_EVICTION_COMMAND_UDW REG_BIT(36 - 32)
> +#define LSCFE_SAME_ADDRESS_ATOMICS_COALESCING_DISABLE REG_BIT(35 - 32)
> +
> +#define ROW_CHICKEN5 XE_REG_MCR(0xe7f0)
> +#define CPSS_AWARE_DIS REG_BIT(3)
>
> #define SARB_CHICKEN1 XE_REG_MCR(0xe90c)
> #define COMP_CKN_IN REG_GENMASK(30, 29)
> diff --git a/drivers/gpu/drm/xe/xe_reg_whitelist.c
> b/drivers/gpu/drm/xe/xe_reg_whitelist.c
> index 1d36c09681aa..9c513778d370 100644
> --- a/drivers/gpu/drm/xe/xe_reg_whitelist.c
> +++ b/drivers/gpu/drm/xe/xe_reg_whitelist.c
> @@ -81,6 +81,14 @@ static const struct xe_rtp_entry_sr register_whitelist[] =
> {
> WHITELIST(VFLSKPD,
> RING_FORCE_TO_NONPRIV_ACCESS_RW))
> },
> + { XE_RTP_NAME("14024997852"),
> + XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0),
> + ENGINE_CLASS(RENDER)),
> + XE_RTP_ACTIONS(WHITELIST(FF_MODE,
> + RING_FORCE_TO_NONPRIV_ACCESS_RW),
> + WHITELIST(VFLSKPD,
> + RING_FORCE_TO_NONPRIV_ACCESS_RW))
> + },
>
> #define WHITELIST_OA_MMIO_TRG(trg, status, head) \
> WHITELIST(trg, RING_FORCE_TO_NONPRIV_ACCESS_RW), \
> diff --git a/drivers/gpu/drm/xe/xe_wa.c b/drivers/gpu/drm/xe/xe_wa.c
> index a991ee2b8781..68a494743b34 100644
> --- a/drivers/gpu/drm/xe/xe_wa.c
> +++ b/drivers/gpu/drm/xe/xe_wa.c
> @@ -306,6 +306,31 @@ static const struct xe_rtp_entry_sr gt_was[] = {
> XE_RTP_RULES(GRAPHICS_VERSION_RANGE(3000, 3005)),
> XE_RTP_ACTIONS(SET(GUC_INTR_CHICKEN, DISABLE_SIGNALING_ENGINES))
> },
> +
> + /* Xe3P_LPG */
> +
> + { XE_RTP_NAME("14025160223"),
> + XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0)),
> + XE_RTP_ACTIONS(SET(MMIOATSREQLIMIT_GAM_WALK_3D,
> + DIS_ATS_WRONLY_PG))
> + },
> + { XE_RTP_NAME("16028780921"),
> + XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0)),
> + XE_RTP_ACTIONS(SET(CCCHKNREG2, LOCALITYDIS))
> + },
> + { XE_RTP_NAME("14026144927"),
> + XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0)),
> + XE_RTP_ACTIONS(SET(L3SQCREG2, L3_SQ_DISABLE_COAMA_2WAY_COH |
> + L3_SQ_DISABLE_COAMA))
> + },
> + { XE_RTP_NAME("14025635424"),
> + XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0)),
> + XE_RTP_ACTIONS(SET(GAMSTLB_CTRL2, STLB_SINGLE_BANK_MODE))
> + },
> + { XE_RTP_NAME("16028005424"),
> + XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0)),
> + XE_RTP_ACTIONS(SET(GUC_INTR_CHICKEN, DISABLE_SIGNALING_ENGINES))
> + },
> };
>
> static const struct xe_rtp_entry_sr engine_was[] = {
> @@ -680,6 +705,24 @@ static const struct xe_rtp_entry_sr engine_was[] = {
> FUNC(xe_rtp_match_gt_has_discontiguous_dss_groups)),
> XE_RTP_ACTIONS(SET(TDL_CHICKEN, EUSTALL_PERF_SAMPLING_DISABLE))
> },
> +
> + /* Xe3p_LPG*/
> +
> + { XE_RTP_NAME("22021149932"),
> + XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0),
> + FUNC(xe_rtp_match_first_render_or_compute)),
> + XE_RTP_ACTIONS(SET(LSC_CHICKEN_BIT_0_UDW, SAMPLER_LD_LSC_DISABLE))
> + },
> + { XE_RTP_NAME("14025676848"),
> + XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0),
> + FUNC(xe_rtp_match_first_render_or_compute)),
> + XE_RTP_ACTIONS(SET(LSC_CHICKEN_BIT_0_UDW,
> LSCFE_SAME_ADDRESS_ATOMICS_COALESCING_DISABLE))
> + },
> + { XE_RTP_NAME("16028951944"),
> + XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0),
> + FUNC(xe_rtp_match_first_render_or_compute)),
> + XE_RTP_ACTIONS(SET(ROW_CHICKEN5, CPSS_AWARE_DIS))
> + },
> };
>
> static const struct xe_rtp_entry_sr lrc_was[] = {
> @@ -879,6 +922,11 @@ static const struct xe_rtp_entry_sr lrc_was[] = {
> ENGINE_CLASS(RENDER)),
> XE_RTP_ACTIONS(SET(CHICKEN_RASTER_1, DIS_CLIP_NEGATIVE_BOUNDING_BOX))
> },
> + { XE_RTP_NAME("14025780377"),
> + XE_RTP_RULES(GRAPHICS_VERSION(3510), GRAPHICS_STEP(A0, B0),
> + ENGINE_CLASS(RENDER)),
> + XE_RTP_ACTIONS(SET(TBIMR_MODE, RXBAR_NO_UAV_DEC_SYNC))
I'm not sure if this one is actually needed. Originally the workaround
ticket just said "program 0x6200[12]" but it's since been updated to an
"if (por) no workaround needed, else if (non-POR thing) program the
register and add a stalling flush." There are also comments in the
ticket itself that indicate it shouldn't actually be relevant to this
specific platform due to other characteristics of the platform; it's
just something that they'll need to fix or workaround in the future so
that it doesn't impact future derivative platforms.
Matt
> + },
> };
>
> static __maybe_unused const struct xe_rtp_entry oob_was[] = {
>
> --
> 2.52.0
>
--
Matt Roper
Graphics Software Engineer
Linux GPU Platform Enablement
Intel Corporation