Mali-Gx20 and Mali-Gx25 deprecates the use of FLUSH_MEM and FLUSH_PT
MMU_AS commands in favour of cache maintenance via
GPU_COMMAND's FLUSH_CACHES and FLUSH_PA_RANGE.
They also introduce the following registers:
- GPU_COMMAND_ARG0~1
- SHADER_PWRFEATURES
- AMBA_FEATURES
- AMBA_ENABLE
This patch enables FLUSH_CACHES for both families of GPUs via the
PANTHOR_HW_FEATURE_GPU_CTRL_CACHE_FLUSH bit until FLUSH_PA_RANGE support
is added. It also adds the aforementioned register definitions and
firmware binary support for arch 12.8 and 13.8.
Signed-off-by: Karunika Choo <karunika.choo@arm.com>
---
drivers/gpu/drm/panthor/panthor_fw.c | 2 ++
drivers/gpu/drm/panthor/panthor_hw.c | 30 ++++++++++++++++++++++++++
drivers/gpu/drm/panthor/panthor_regs.h | 12 +++++++++++
3 files changed, 44 insertions(+)
diff --git a/drivers/gpu/drm/panthor/panthor_fw.c b/drivers/gpu/drm/panthor/panthor_fw.c
index fa6e0b48a0b2..9bf06e55eaee 100644
--- a/drivers/gpu/drm/panthor/panthor_fw.c
+++ b/drivers/gpu/drm/panthor/panthor_fw.c
@@ -1405,3 +1405,5 @@ MODULE_FIRMWARE("arm/mali/arch10.8/mali_csffw.bin");
MODULE_FIRMWARE("arm/mali/arch10.10/mali_csffw.bin");
MODULE_FIRMWARE("arm/mali/arch10.12/mali_csffw.bin");
MODULE_FIRMWARE("arm/mali/arch11.8/mali_csffw.bin");
+MODULE_FIRMWARE("arm/mali/arch12.8/mali_csffw.bin");
+MODULE_FIRMWARE("arm/mali/arch13.8/mali_csffw.bin");
diff --git a/drivers/gpu/drm/panthor/panthor_hw.c b/drivers/gpu/drm/panthor/panthor_hw.c
index 5ec9d7f28368..281d86c4715e 100644
--- a/drivers/gpu/drm/panthor/panthor_hw.c
+++ b/drivers/gpu/drm/panthor/panthor_hw.c
@@ -61,6 +61,24 @@ static char *get_gpu_model_name(struct panthor_device *ptdev)
fallthrough;
case GPU_PROD_ID_MAKE(11, 3):
return "Mali-G615";
+ case GPU_PROD_ID_MAKE(12, 0):
+ if (shader_core_count >= 10 && ray_intersection)
+ return "Mali-G720-Immortalis";
+ else if (shader_core_count >= 6)
+ return "Mali-G720";
+
+ fallthrough;
+ case GPU_PROD_ID_MAKE(12, 1):
+ return "Mali-G620";
+ case GPU_PROD_ID_MAKE(13, 0):
+ if (shader_core_count >= 10 && ray_intersection)
+ return "Mali-G925-Immortalis";
+ else if (shader_core_count >= 6)
+ return "Mali-G725";
+
+ fallthrough;
+ case GPU_PROD_ID_MAKE(13, 1):
+ return "Mali-G625";
}
return "(Unknown Mali GPU)";
@@ -109,6 +127,18 @@ static struct panthor_hw panthor_hw_devices[] = {
BIT(PANTHOR_HW_FEATURE_GPU_CTRL_CACHE_FLUSH)
},
},
+ {
+ .arch_major = 12,
+ .features = {
+ BIT(PANTHOR_HW_FEATURE_GPU_CTRL_CACHE_FLUSH)
+ },
+ },
+ {
+ .arch_major = 13,
+ .features = {
+ BIT(PANTHOR_HW_FEATURE_GPU_CTRL_CACHE_FLUSH)
+ },
+ },
};
static int init_gpu_id(struct panthor_device *ptdev)
diff --git a/drivers/gpu/drm/panthor/panthor_regs.h b/drivers/gpu/drm/panthor/panthor_regs.h
index 4eaa2b612756..8e01440f8743 100644
--- a/drivers/gpu/drm/panthor/panthor_regs.h
+++ b/drivers/gpu/drm/panthor/panthor_regs.h
@@ -89,6 +89,8 @@
#define GPU_DOORBELL_FEATURES 0xC0
+#define GPU_COMMAND_ARG(n) (0xD0 + ((n) * 8))
+
#define GPU_SHADER_PRESENT 0x100
#define GPU_TILER_PRESENT 0x110
#define GPU_L2_PRESENT 0x120
@@ -98,6 +100,8 @@
#define L2_READY 0x160
#define SHADER_PWRON 0x180
+#define SHADER_PWRFEATURES 0x188
+#define SHADER_PWRFEATURES_RAY_TRACING_UNIT BIT(0)
#define TILER_PWRON 0x190
#define L2_PWRON 0x1A0
@@ -125,6 +129,13 @@
#define GPU_COHERENCY_ACE 1
#define GPU_COHERENCY_NONE 31
+#define AMBA_FEATURES 0x300
+#define AMBA_FEATURES_ACE_LITE BIT(0)
+#define AMBA_FEATURES_ACE BIT(1)
+#define AMBA_FEATURES_SHAREABLE_CACHE_SUPPORT BIT(5)
+
+#define AMBA_ENABLE 0x304
+
#define GPU_SYSC_PBHA_OVERRIDE(n) (0x320 + ((n) * 4))
#define GPU_SYSC_ALLOC(n) (0x340 + ((n) * 4))
@@ -138,6 +149,7 @@
#define MCU_STATUS_ENABLED 1
#define MCU_STATUS_HALT 2
#define MCU_STATUS_FATAL 3
+#define MCU_FEATURES 0x708
/* Job Control regs */
#define JOB_INT_RAWSTAT 0x1000
--
2.49.0
On Mon, Jun 2, 2025 at 7:34 AM Karunika Choo <karunika.choo@arm.com> wrote: > > Mali-Gx20 and Mali-Gx25 deprecates the use of FLUSH_MEM and FLUSH_PT > MMU_AS commands in favour of cache maintenance via > GPU_COMMAND's FLUSH_CACHES and FLUSH_PA_RANGE. > > They also introduce the following registers: > - GPU_COMMAND_ARG0~1 > - SHADER_PWRFEATURES > - AMBA_FEATURES > - AMBA_ENABLE > > This patch enables FLUSH_CACHES for both families of GPUs via the > PANTHOR_HW_FEATURE_GPU_CTRL_CACHE_FLUSH bit until FLUSH_PA_RANGE support > is added. It also adds the aforementioned register definitions and > firmware binary support for arch 12.8 and 13.8. <snipped> > diff --git a/drivers/gpu/drm/panthor/panthor_regs.h b/drivers/gpu/drm/panthor/panthor_regs.h > index 4eaa2b612756..8e01440f8743 100644 > --- a/drivers/gpu/drm/panthor/panthor_regs.h > +++ b/drivers/gpu/drm/panthor/panthor_regs.h > @@ -89,6 +89,8 @@ > > #define GPU_DOORBELL_FEATURES 0xC0 > > +#define GPU_COMMAND_ARG(n) (0xD0 + ((n) * 8)) > + > #define GPU_SHADER_PRESENT 0x100 > #define GPU_TILER_PRESENT 0x110 > #define GPU_L2_PRESENT 0x120 > @@ -98,6 +100,8 @@ > #define L2_READY 0x160 > > #define SHADER_PWRON 0x180 > +#define SHADER_PWRFEATURES 0x188 > +#define SHADER_PWRFEATURES_RAY_TRACING_UNIT BIT(0) > #define TILER_PWRON 0x190 > #define L2_PWRON 0x1A0 > > @@ -125,6 +129,13 @@ > #define GPU_COHERENCY_ACE 1 > #define GPU_COHERENCY_NONE 31 > > +#define AMBA_FEATURES 0x300 > +#define AMBA_FEATURES_ACE_LITE BIT(0) > +#define AMBA_FEATURES_ACE BIT(1) > +#define AMBA_FEATURES_SHAREABLE_CACHE_SUPPORT BIT(5) > + > +#define AMBA_ENABLE 0x304 We still use GPU_COHERENCY_FEATURES / GPU_COHERENCY_PROTOCOL even on v12 and v13. I suppose they are compatible with AMBA_FEATURES / AMBA_ENABLE to some degree? We should unify them.
On 11/06/2025 00:45, Chia-I Wu wrote: > On Mon, Jun 2, 2025 at 7:34 AM Karunika Choo <karunika.choo@arm.com> wrote: >> >> Mali-Gx20 and Mali-Gx25 deprecates the use of FLUSH_MEM and FLUSH_PT >> MMU_AS commands in favour of cache maintenance via >> GPU_COMMAND's FLUSH_CACHES and FLUSH_PA_RANGE. >> >> They also introduce the following registers: >> - GPU_COMMAND_ARG0~1 >> - SHADER_PWRFEATURES >> - AMBA_FEATURES >> - AMBA_ENABLE >> >> This patch enables FLUSH_CACHES for both families of GPUs via the >> PANTHOR_HW_FEATURE_GPU_CTRL_CACHE_FLUSH bit until FLUSH_PA_RANGE support >> is added. It also adds the aforementioned register definitions and >> firmware binary support for arch 12.8 and 13.8. > <snipped> >> diff --git a/drivers/gpu/drm/panthor/panthor_regs.h b/drivers/gpu/drm/panthor/panthor_regs.h >> index 4eaa2b612756..8e01440f8743 100644 >> --- a/drivers/gpu/drm/panthor/panthor_regs.h >> +++ b/drivers/gpu/drm/panthor/panthor_regs.h >> @@ -89,6 +89,8 @@ >> >> #define GPU_DOORBELL_FEATURES 0xC0 >> >> +#define GPU_COMMAND_ARG(n) (0xD0 + ((n) * 8)) >> + >> #define GPU_SHADER_PRESENT 0x100 >> #define GPU_TILER_PRESENT 0x110 >> #define GPU_L2_PRESENT 0x120 >> @@ -98,6 +100,8 @@ >> #define L2_READY 0x160 >> >> #define SHADER_PWRON 0x180 >> +#define SHADER_PWRFEATURES 0x188 >> +#define SHADER_PWRFEATURES_RAY_TRACING_UNIT BIT(0) >> #define TILER_PWRON 0x190 >> #define L2_PWRON 0x1A0 >> >> @@ -125,6 +129,13 @@ >> #define GPU_COHERENCY_ACE 1 >> #define GPU_COHERENCY_NONE 31 >> >> +#define AMBA_FEATURES 0x300 >> +#define AMBA_FEATURES_ACE_LITE BIT(0) >> +#define AMBA_FEATURES_ACE BIT(1) >> +#define AMBA_FEATURES_SHAREABLE_CACHE_SUPPORT BIT(5) >> + >> +#define AMBA_ENABLE 0x304 > We still use GPU_COHERENCY_FEATURES / GPU_COHERENCY_PROTOCOL even on > v12 and v13. I suppose they are compatible with AMBA_FEATURES / > AMBA_ENABLE to some degree? We should unify them. Hello, Due to some changes in the fields between AMBA_ENABLE and GPU_COHERENCY_PROTOCOL, namely SHAREABLE_CACHE_SUPPORT, which has a value of BIT(5), the previous assumption that FEATURE = BIT(PROTOCOL) for GPU_COHERENCY_FEATURES is no longer valid. As such, I have updated the field Macros for GPU_COHERENCY_FEATURES to enable merging of the two register fields. Hopefully this addresses your comments. Kind regards, Karunika
© 2016 - 2025 Red Hat, Inc.