On 11/06/2026 17:04, Karunika Choo wrote:
> On 11/06/2026 16:18, Steven Price wrote:
>> On 28/05/2026 16:05, Karunika Choo wrote:
>>> Add the panthor hardware description for Mali v15 GPUs and hook it into
>>> device matching.
>>>
>>> This includes the v15 register map and product identification needed to
>>> populate the GPU information exposed by the driver and its uAPI.
>>>
>>> Add compatibility string for v15 GPUs.
>>>
>>> Signed-off-by: Karunika Choo <[email protected]>
>>> ---
>>> drivers/gpu/drm/panthor/panthor_drv.c | 1 +
>>> drivers/gpu/drm/panthor/panthor_fw.c | 1 +
>>> .../drm/panthor/panthor_gpu_discover_regs.h | 25 ++++++
>>> drivers/gpu/drm/panthor/panthor_heap.c | 3 +-
>>> drivers/gpu/drm/panthor/panthor_hw.c | 81 ++++++++++++++++++-
>>> drivers/gpu/drm/panthor/panthor_hw.h | 13 +++
>>> include/uapi/drm/panthor_drm.h | 10 ++-
>>> 7 files changed, 128 insertions(+), 6 deletions(-)
>>>
>>> diff --git a/drivers/gpu/drm/panthor/panthor_drv.c
>>> b/drivers/gpu/drm/panthor/panthor_drv.c
>>> index e8dc4096c1d2..21644a60c8e4 100644
>>> --- a/drivers/gpu/drm/panthor/panthor_drv.c
>>> +++ b/drivers/gpu/drm/panthor/panthor_drv.c
>>> @@ -1875,6 +1875,7 @@ static const struct of_device_id dt_match[] = {
>>> { .compatible = "mediatek,mt8196-mali", .data =
>>> &soc_data_mediatek_mt8196, },
>>> { .compatible = "rockchip,rk3588-mali" },
>>> { .compatible = "arm,mali-valhall-csf" },
>>> + { .compatible = "arm,mali-gen5-am" },
>>
>> Just a heads up: a new DT compatible should have a binding document
>> describing it. So this can't be merged until the DT bindings change is
>> agreed.
>>
>
> In this case are we leaning more towards a new arm,mali-gen5-am.yaml
> or is it preferrable to update arm/mali-valhall-csf.yaml instead?
You've probably got a better idea of how similar it is to
mali-valhall-csf.yaml. I don't have a preference as to how it's
documented - although others might. But we get into issues if the
bindings aren't agreed before the code using them is merged.
Thanks,
Steve
>>> {}
>>> };
>>> MODULE_DEVICE_TABLE(of, dt_match);
>>> diff --git a/drivers/gpu/drm/panthor/panthor_fw.c
>>> b/drivers/gpu/drm/panthor/panthor_fw.c
>>> index f6381f5f236f..e2a511b741f4 100644
>>> --- a/drivers/gpu/drm/panthor/panthor_fw.c
>>> +++ b/drivers/gpu/drm/panthor/panthor_fw.c
>>> @@ -1529,3 +1529,4 @@ MODULE_FIRMWARE("arm/mali/arch11.8/mali_csffw.bin");
>>> MODULE_FIRMWARE("arm/mali/arch12.8/mali_csffw.bin");
>>> MODULE_FIRMWARE("arm/mali/arch13.8/mali_csffw.bin");
>>> MODULE_FIRMWARE("arm/mali/arch14.8/mali_csffw.bin");
>>> +MODULE_FIRMWARE("arm/mali/arch15.8/mali_csffw.bin");
>>> diff --git a/drivers/gpu/drm/panthor/panthor_gpu_discover_regs.h
>>> b/drivers/gpu/drm/panthor/panthor_gpu_discover_regs.h
>>> index 54bb104902ee..9c64676dc35a 100644
>>> --- a/drivers/gpu/drm/panthor/panthor_gpu_discover_regs.h
>>> +++ b/drivers/gpu/drm/panthor/panthor_gpu_discover_regs.h
>>> @@ -14,4 +14,29 @@
>>> #define GPU_WIDE_VER_MINOR(x) (((x) &
>>> GENMASK(15, 8)) >> 8)
>>> #define GPU_WIDE_VER_STATUS(x) ((x) & GENMASK(7, 0))
>>>
>>> +#define DISCOVER_REVIDR 0x8
>>> +#define DISCOVER_GPU_FEATURES 0x20
>>> +#define GPU_FEATURES_VARIABLE_RATE_SHADING BIT(0)
>>> +#define GPU_FEATURES_SIMD_STATE BIT(1)
>>> +#define GPU_FEATURES_CROSS_STREAM_SYNC BIT(3)
>>> +#define GPU_FEATURES_NX BIT(4)
>>> +#define GPU_FEATURES_RAY_TRAVERSAL BIT(5)
>>> +#define GPU_FEATURES_LD_LEA_TENSOR_INSTRUCTIONS BIT(6)
>>> +#define DISCOVER_MCU_FEATURES 0x40
>>> +#define DISCOVER_PRFCNT_FEATURES 0x50
>>> +#define PRFCNT_FEATURES_COUNTER_BLOCK_SIZE(x) (((x) &
>>> GENMASK(7, 0)) << 8)
>>> +#define DISCOVER_DOORBELL_FEATURES 0x60
>>> +#define DISCOVER_MEM_FEATURES 0x100
>>> +#define DISCOVER_MMU_FEATURES 0x108
>>> +#define MMU_FEATURES_AS_COUNT(x) (((x) & GENMASK(23,
>>> 16)) >> 16)
>>> +#define DISCOVER_AMBA_FEATURES 0x120
>>> +
>>> +#define DISCOVER_L2_FEATURES 0x128
>>> +#define DISCOVER_TILER_FEATURES 0x200
>>> +#define DISCOVER_CORE_FEATURES 0x300
>>> +#define DISCOVER_THREAD_FEATURES 0x320
>>> +#define DISCOVER_THREAD_MAX_THREADS 0x330
>>> +#define DISCOVER_THREAD_NUM_ACTIVE_GRANULARITY 0x334
>>> +#define DISCOVER_TEXTURE_FEATURES 0x360
>>> +
>>> #endif /* __PANTHOR_GPU_DISCOVER_REGS_H__ */
>>> diff --git a/drivers/gpu/drm/panthor/panthor_heap.c
>>> b/drivers/gpu/drm/panthor/panthor_heap.c
>>> index 99311abdf1e9..afb7d68abc87 100644
>>> --- a/drivers/gpu/drm/panthor/panthor_heap.c
>>> +++ b/drivers/gpu/drm/panthor/panthor_heap.c
>>> @@ -11,6 +11,7 @@
>>> #include "panthor_gem.h"
>>> #include "panthor_gpu_regs.h"
>>> #include "panthor_heap.h"
>>> +#include "panthor_hw.h"
>>> #include "panthor_mmu.h"
>>>
>>> /*
>>> @@ -105,7 +106,7 @@ struct panthor_heap_pool {
>>>
>>> static int panthor_heap_ctx_stride(struct panthor_device *ptdev)
>>> {
>>> - u32 l2_features = ptdev->gpu_info.l2_features;
>>> + u64 l2_features = panthor_hw_get_l2_features(ptdev);
>>> u32 gpu_cache_line_size = GPU_L2_FEATURES_LINE_SIZE(l2_features);
>>>
>>> return ALIGN(HEAP_CONTEXT_SIZE, gpu_cache_line_size);
>>> diff --git a/drivers/gpu/drm/panthor/panthor_hw.c
>>> b/drivers/gpu/drm/panthor/panthor_hw.c
>>> index e677f1a8f488..52271fb9db52 100644
>>> --- a/drivers/gpu/drm/panthor/panthor_hw.c
>>> +++ b/drivers/gpu/drm/panthor/panthor_hw.c
>>> @@ -65,6 +65,23 @@ static struct panthor_hw panthor_hw_arch_v14 = {
>>> },
>>> };
>>>
>>> +static struct panthor_hw panthor_hw_arch_v15 = {
>>> + .ops = {
>>> + .soft_reset = panthor_pwr_reset_soft,
>>> + .l2_power_off = panthor_pwr_l2_power_off,
>>> + .l2_power_on = panthor_pwr_l2_power_on,
>>> + },
>>> + .map = {
>>> + .gpu_control_base = 0x3000,
>>> + .pwr_control_base = 0x3800,
>>> + .mcu_control_base = 0x3100,
>>> + .mmu_as = {
>>> + .base = 0x2800,
>>> + .stride = 0x80,
>>> + },
>>> + },
>>> +};
>>> +
>>> static struct panthor_hw_entry panthor_hw_match[] = {
>>> {
>>> .arch_min = 10,
>>> @@ -76,6 +93,11 @@ static struct panthor_hw_entry panthor_hw_match[] = {
>>> .arch_max = 14,
>>> .hwdev = &panthor_hw_arch_v14,
>>> },
>>> + {
>>> + .arch_min = 15,
>>> + .arch_max = 15,
>>> + .hwdev = &panthor_hw_arch_v15,
>>> + }
>>> };
>>>
>>> static int panthor_hw_set_power_tracing(struct device *dev, void *data)
>>> @@ -187,6 +209,12 @@ static char *get_gpu_model_name(struct panthor_device
>>> *ptdev)
>>> return "Mali-G1-Premium";
>>> case GPU_PROD_ID_MAKE(14, 3):
>>> return "Mali-G1-Pro";
>>> + case GPU_PROD_ID_MAKE(15, 0):
>>> + return "Mali-G2-Ultra";
>>> + case GPU_PROD_ID_MAKE(15, 1):
>>> + return "Mali-G2-Premium";
>>> + case GPU_PROD_ID_MAKE(15, 3):
>>> + return "Mali-G2-Pro";
>>> }
>>>
>>> return "(Unknown Mali GPU)";
>>> @@ -210,7 +238,7 @@ static int overload_shader_present(struct
>>> panthor_device *ptdev)
>>> return 0;
>>> }
>>>
>>> -static int panthor_gpu_info_init(struct panthor_device *ptdev)
>>> +static void panthor_gpu_info_v10_init(struct panthor_device *ptdev)
>>> {
>>> unsigned int i;
>>>
>>> @@ -251,12 +279,56 @@ static int panthor_gpu_info_init(struct
>>> panthor_device *ptdev)
>>> ptdev->gpu_info.tiler_present = gpu_read64(gpu_iomem,
>>> GPU_TILER_PRESENT);
>>> ptdev->gpu_info.l2_present = gpu_read64(gpu_iomem,
>>> GPU_L2_PRESENT);
>>> }
>>> +}
>>> +
>>> +static void panthor_gpu_info_v15_init(struct panthor_device *ptdev)
>>> +{
>>> + void __iomem *pwr_iomem = ptdev->iomem +
>>> ptdev->hw->map.pwr_control_base;
>>> + u64 texture_features;
>>> +
>>> + ptdev->gpu_info.gpu_rev_wide = gpu_read64(ptdev->iomem,
>>> DISCOVER_REVIDR);
>>> + ptdev->gpu_info.l2_features_wide = gpu_read64(ptdev->iomem,
>>> DISCOVER_L2_FEATURES);
>>> +
>>> + texture_features = gpu_read64(ptdev->iomem, DISCOVER_TEXTURE_FEATURES);
>>> + ptdev->gpu_info.texture_features[0] = lower_32_bits(texture_features);
>>> + ptdev->gpu_info.texture_features[1] = upper_32_bits(texture_features);
>>> +
>>> + ptdev->gpu_info.thread_features = gpu_read(ptdev->iomem,
>>> DISCOVER_THREAD_FEATURES);
>>> + ptdev->gpu_info.max_threads = gpu_read(ptdev->iomem,
>>> DISCOVER_THREAD_MAX_THREADS);
>>> + ptdev->gpu_info.thread_num_active_granularity =
>>> + gpu_read(ptdev->iomem, DISCOVER_THREAD_NUM_ACTIVE_GRANULARITY);
>>> +
>>> + ptdev->gpu_info.gpu_features = gpu_read64(ptdev->iomem,
>>> DISCOVER_GPU_FEATURES);
>>> +
>>> + /* The following _HI registers do not contain any information (yet) */
>>
>> This is a little confusing as a comment - there are no "_HI" registers
>> mentioned. I think this would be better reworded as "32 bit reads are
>> used as the HI part of the 64 bit register does not contian any
>> information (yet)" (or similar).
>
> ACK.
>
>> Or alternatively you could just upgrade these to 64 bit and be done with
>> it ;)
>>
>>> + ptdev->gpu_info.mem_features = gpu_read(ptdev->iomem,
>>> DISCOVER_MEM_FEATURES);
>>> + ptdev->gpu_info.mmu_features = gpu_read(ptdev->iomem,
>>> DISCOVER_MMU_FEATURES);
>>> + ptdev->gpu_info.coherency_features = gpu_read(ptdev->iomem,
>>> DISCOVER_AMBA_FEATURES);
>>> + ptdev->gpu_info.tiler_features = gpu_read(ptdev->iomem,
>>> DISCOVER_TILER_FEATURES);
>>> + ptdev->gpu_info.core_features = gpu_read(ptdev->iomem,
>>> DISCOVER_CORE_FEATURES);
>>> +
>>> + /* AS_PRESENT register removed on v15+ create virtual mask from
>>> MMU_FEATURES.AS_COUNT */
>>> + ptdev->gpu_info.as_present =
>>> + (1U << MMU_FEATURES_AS_COUNT(ptdev->gpu_info.mmu_features)) - 1;
>>
>> This might be better expressed using GENMASK:
>>
>> GENMASK(MMU_FEATURES_AS_COUNT(ptdev->gpu_info.mmu_features) - 1, 0)
>>
>
> ACK.
>
> Kind regards,
> Karunika
>
>>> +
>>> + ptdev->gpu_info.l2_present = gpu_read64(pwr_iomem, PWR_L2_PRESENT);
>>> + ptdev->gpu_info.tiler_present = gpu_read64(pwr_iomem,
>>> PWR_TILER_PRESENT);
>>> + ptdev->gpu_info.shader_present = gpu_read64(pwr_iomem,
>>> PWR_SHADER_PRESENT);
>>> +}
>>> +
>>> +static int panthor_gpu_info_init(struct panthor_device *ptdev)
>>> +{
>>> + if (panthor_hw_has_gpu_discover(ptdev))
>>> + panthor_gpu_info_v15_init(ptdev);
>>> + else
>>> + panthor_gpu_info_v10_init(ptdev);
>>>
>>> return overload_shader_present(ptdev);
>>> }
>>>
>>> static int panthor_hw_info_init(struct panthor_device *ptdev)
>>> {
>>> + u64 l2_features = ptdev->gpu_info.l2_features;
>>> u32 major, minor, status;
>>> int ret;
>>>
>>> @@ -268,14 +340,17 @@ static int panthor_hw_info_init(struct panthor_device
>>> *ptdev)
>>> minor = ptdev->gpu_id.ver.minor;
>>> status = ptdev->gpu_id.ver.status;
>>>
>>> + if (panthor_hw_has_gpu_discover(ptdev))
>>> + l2_features = ptdev->gpu_info.l2_features_wide;
>>> +
>>> drm_info(&ptdev->base,
>>> "%s id 0x%x major 0x%x minor 0x%x status 0x%x",
>>> get_gpu_model_name(ptdev), ptdev->gpu_id.prod_major,
>>> major, minor, status);
>>>
>>> drm_info(&ptdev->base,
>>> - "Features: L2:%#x Tiler:%#x Mem:%#x MMU:%#x AS:%#x",
>>> - ptdev->gpu_info.l2_features,
>>> + "Features: L2:%#llx Tiler:%#x Mem:%#x MMU:%#x AS:%#x",
>>> + l2_features,
>>> ptdev->gpu_info.tiler_features,
>>> ptdev->gpu_info.mem_features,
>>> ptdev->gpu_info.mmu_features,
>>> diff --git a/drivers/gpu/drm/panthor/panthor_hw.h
>>> b/drivers/gpu/drm/panthor/panthor_hw.h
>>> index 0ae11b78c77e..1b2678ea00db 100644
>>> --- a/drivers/gpu/drm/panthor/panthor_hw.h
>>> +++ b/drivers/gpu/drm/panthor/panthor_hw.h
>>> @@ -83,4 +83,17 @@ static inline bool panthor_hw_has_pwr_ctrl(struct
>>> panthor_device *ptdev)
>>> return ptdev->gpu_id.arch.major >= 14;
>>> }
>>>
>>> +static inline bool panthor_hw_has_gpu_discover(struct panthor_device
>>> *ptdev)
>>> +{
>>> + return ptdev->gpu_id.arch.major >= 15;
>>> +}
>>> +
>>> +static inline u64 panthor_hw_get_l2_features(struct panthor_device *ptdev)
>>> +{
>>> + if (panthor_hw_has_gpu_discover(ptdev))
>>> + return ptdev->gpu_info.l2_features_wide;
>>> +
>>> + return ptdev->gpu_info.l2_features;
>>> +}
>>> +
>>> #endif /* __PANTHOR_HW_H__ */
>>> diff --git a/include/uapi/drm/panthor_drm.h b/include/uapi/drm/panthor_drm.h
>>> index 04fc9f133152..2ecc50eade27 100644
>>> --- a/include/uapi/drm/panthor_drm.h
>>> +++ b/include/uapi/drm/panthor_drm.h
>>> @@ -368,8 +368,8 @@ struct drm_panthor_gpu_info {
>>> /** @core_features: Used to discriminate core variants when they exist.
>>> */
>>> __u32 core_features;
>>>
>>> - /** @pad: MBZ. */
>>> - __u32 pad;
>>> + /** @thread_num_active_granularity: Granularity of number of active
>>> threads */
>>> + __u32 thread_num_active_granularity;
>>>
>>> /** @gpu_features: Bitmask describing supported GPU-wide features */
>>> __u64 gpu_features;
>>> @@ -383,6 +383,12 @@ struct drm_panthor_gpu_info {
>>> #define DRM_PANTHOR_WIDE_VERSION_MAJOR(x) (((x) >> 16) & 0xff)
>>> #define DRM_PANTHOR_WIDE_VERSION_MINOR(x) (((x) >> 8) & 0xff)
>>> #define DRM_PANTHOR_WIDE_VERSION_STATUS(x) ((x) & 0xff)
>>> +
>>> + /** @gpu_rev_wide: 64-bit GPU revision for v15 onwards */
>>> + __u64 gpu_rev_wide;
>>> +
>>> + /** @l2_features_wide: 64-bit L2_FEATURES for v15 onwards */
>>> + __u64 l2_features_wide;
>>> };
>>>
>>> /**
>>
>