Initialise the GSP resource manager arguments (rmargs) which provide
initialisation parameters to the GSP firmware during boot. The rmargs
structure contains arguments to configure the GSP message/command queue
location.
These are mapped for coherent DMA and added to the libos data structure
for access when booting GSP.
Signed-off-by: Alistair Popple <apopple@nvidia.com>
---
Changes for v2:
- Rebased on Alex's latest series
---
drivers/gpu/nova-core/gsp.rs | 29 +++++++++++++++-
drivers/gpu/nova-core/gsp/cmdq.rs | 14 ++++++--
drivers/gpu/nova-core/gsp/fw.rs | 19 +++++++++++
.../gpu/nova-core/gsp/fw/r570_144/bindings.rs | 33 +++++++++++++++++++
4 files changed, 91 insertions(+), 4 deletions(-)
diff --git a/drivers/gpu/nova-core/gsp.rs b/drivers/gpu/nova-core/gsp.rs
index 3d4028d67d2e..bb08bd537ec4 100644
--- a/drivers/gpu/nova-core/gsp.rs
+++ b/drivers/gpu/nova-core/gsp.rs
@@ -17,7 +17,10 @@
use crate::fb::FbLayout;
use crate::gsp::cmdq::GspCmdq;
-use fw::LibosMemoryRegionInitArgument;
+use fw::{
+ LibosMemoryRegionInitArgument, GSP_ARGUMENTS_CACHED, GSP_SR_INIT_ARGUMENTS,
+ MESSAGE_QUEUE_INIT_ARGUMENTS,
+};
pub(crate) mod cmdq;
@@ -33,6 +36,7 @@ pub(crate) struct Gsp {
pub logintr: CoherentAllocation<u8>,
pub logrm: CoherentAllocation<u8>,
pub cmdq: GspCmdq,
+ rmargs: CoherentAllocation<GSP_ARGUMENTS_CACHED>,
}
/// Creates a self-mapping page table for `obj` at its beginning.
@@ -90,12 +94,35 @@ pub(crate) fn new(pdev: &pci::Device<device::Bound>) -> Result<impl PinInit<Self
// Creates its own PTE array
let cmdq = GspCmdq::new(dev)?;
+ let rmargs =
+ create_coherent_dma_object::<GSP_ARGUMENTS_CACHED>(dev, "RMARGS", 1, &mut libos, 3)?;
+ let (shared_mem_phys_addr, cmd_queue_offset, stat_queue_offset) = cmdq.get_cmdq_offsets();
+
+ dma_write!(
+ rmargs[0].messageQueueInitArguments = MESSAGE_QUEUE_INIT_ARGUMENTS {
+ sharedMemPhysAddr: shared_mem_phys_addr,
+ pageTableEntryCount: cmdq.nr_ptes,
+ cmdQueueOffset: cmd_queue_offset,
+ statQueueOffset: stat_queue_offset,
+ ..Default::default()
+ }
+ )?;
+ dma_write!(
+ rmargs[0].srInitArguments = GSP_SR_INIT_ARGUMENTS {
+ oldLevel: 0,
+ flags: 0,
+ bInPMTransition: 0,
+ ..Default::default()
+ }
+ )?;
+ dma_write!(rmargs[0].bDmemStack = 1)?;
Ok(try_pin_init!(Self {
libos,
loginit,
logintr,
logrm,
+ rmargs,
cmdq,
}))
}
diff --git a/drivers/gpu/nova-core/gsp/cmdq.rs b/drivers/gpu/nova-core/gsp/cmdq.rs
index a9ba1a4c73d8..9170ccf4a064 100644
--- a/drivers/gpu/nova-core/gsp/cmdq.rs
+++ b/drivers/gpu/nova-core/gsp/cmdq.rs
@@ -99,7 +99,6 @@ fn new(dev: &device::Device<device::Bound>) -> Result<Self> {
Ok(Self(gsp_mem))
}
- #[expect(unused)]
fn dma_handle(&self) -> DmaAddress {
self.0.dma_handle()
}
@@ -218,7 +217,7 @@ pub(crate) struct GspCmdq {
dev: ARef<device::Device>,
seq: u32,
gsp_mem: DmaGspMem,
- pub _nr_ptes: u32,
+ pub nr_ptes: u32,
}
impl GspCmdq {
@@ -231,7 +230,7 @@ pub(crate) fn new(dev: &device::Device<device::Bound>) -> Result<GspCmdq> {
dev: dev.into(),
seq: 0,
gsp_mem,
- _nr_ptes: nr_ptes as u32,
+ nr_ptes: nr_ptes as u32,
})
}
@@ -382,6 +381,15 @@ pub(crate) fn receive_msg_from_gsp<M: GspMessageFromGsp, R>(
.advance_cpu_read_ptr(msg_header.rpc.length.div_ceil(GSP_PAGE_SIZE as u32));
result
}
+
+ pub(crate) fn get_cmdq_offsets(&self) -> (u64, u64, u64) {
+ (
+ self.gsp_mem.dma_handle(),
+ core::mem::offset_of!(Msgq, msgq) as u64,
+ (core::mem::offset_of!(GspMem, gspq) - core::mem::offset_of!(GspMem, cpuq)
+ + core::mem::offset_of!(Msgq, msgq)) as u64,
+ )
+ }
}
fn decode_gsp_function(function: u32) -> &'static str {
diff --git a/drivers/gpu/nova-core/gsp/fw.rs b/drivers/gpu/nova-core/gsp/fw.rs
index 2e4255301e58..06841b103328 100644
--- a/drivers/gpu/nova-core/gsp/fw.rs
+++ b/drivers/gpu/nova-core/gsp/fw.rs
@@ -158,9 +158,15 @@ pub(crate) fn new(gsp_firmware: &GspFirmware, fb_layout: &FbLayout) -> Self {
}
pub(crate) use r570_144::{
+ GSP_ARGUMENTS_CACHED,
+
// GSP firmware constants
GSP_FW_WPR_META_MAGIC,
GSP_FW_WPR_META_REVISION,
+ GSP_SR_INIT_ARGUMENTS,
+
+ // RM message queue parameters
+ MESSAGE_QUEUE_INIT_ARGUMENTS,
// GSP events
NV_VGPU_MSG_EVENT_GSP_INIT_DONE,
@@ -313,3 +319,16 @@ pub(crate) fn new(sequence: u32, cmd_size: usize, function: u32) -> Self {
}
}
}
+
+// SAFETY: Padding is explicit and will not contain uninitialized data.
+unsafe impl AsBytes for GSP_ARGUMENTS_CACHED {}
+
+// SAFETY: This struct only contains integer types for which all bit patterns
+// are valid.
+unsafe impl FromBytes for GSP_ARGUMENTS_CACHED {}
+
+// SAFETY: Padding is explicit and will not contain uninitialized data.
+unsafe impl AsBytes for MESSAGE_QUEUE_INIT_ARGUMENTS {}
+
+// SAFETY: Padding is explicit and will not contain uninitialized data.
+unsafe impl AsBytes for GSP_SR_INIT_ARGUMENTS {}
diff --git a/drivers/gpu/nova-core/gsp/fw/r570_144/bindings.rs b/drivers/gpu/nova-core/gsp/fw/r570_144/bindings.rs
index 3d96d91e5b12..b87c4e6cb857 100644
--- a/drivers/gpu/nova-core/gsp/fw/r570_144/bindings.rs
+++ b/drivers/gpu/nova-core/gsp/fw/r570_144/bindings.rs
@@ -319,6 +319,39 @@ fn fmt(&self, fmt: &mut ::core::fmt::Formatter<'_>) -> ::core::fmt::Result {
pub const NV_VGPU_MSG_EVENT_NUM_EVENTS: _bindgen_ty_3 = 4131;
pub type _bindgen_ty_3 = ffi::c_uint;
#[repr(C)]
+#[derive(Debug, Default, Copy, Clone)]
+pub struct MESSAGE_QUEUE_INIT_ARGUMENTS {
+ pub sharedMemPhysAddr: u64_,
+ pub pageTableEntryCount: u32_,
+ pub __bindgen_padding_0: [u8; 4usize],
+ pub cmdQueueOffset: u64_,
+ pub statQueueOffset: u64_,
+}
+#[repr(C)]
+#[derive(Debug, Default, Copy, Clone)]
+pub struct GSP_SR_INIT_ARGUMENTS {
+ pub oldLevel: u32_,
+ pub flags: u32_,
+ pub bInPMTransition: u8_,
+ pub __bindgen_padding_0: [u8; 3usize],
+}
+#[repr(C)]
+#[derive(Debug, Default, Copy, Clone)]
+pub struct GSP_ARGUMENTS_CACHED {
+ pub messageQueueInitArguments: MESSAGE_QUEUE_INIT_ARGUMENTS,
+ pub srInitArguments: GSP_SR_INIT_ARGUMENTS,
+ pub gpuInstance: u32_,
+ pub bDmemStack: u8_,
+ pub __bindgen_padding_0: [u8; 7usize],
+ pub profilerArgs: GSP_ARGUMENTS_CACHED__bindgen_ty_1,
+}
+#[repr(C)]
+#[derive(Debug, Default, Copy, Clone)]
+pub struct GSP_ARGUMENTS_CACHED__bindgen_ty_1 {
+ pub pa: u64_,
+ pub size: u64_,
+}
+#[repr(C)]
#[derive(Copy, Clone)]
pub union rpc_message_rpc_union_field_v03_00 {
pub spare: u32_,
--
2.50.1
On Mon Sep 22, 2025 at 8:30 PM JST, Alistair Popple wrote:
> Initialise the GSP resource manager arguments (rmargs) which provide
> initialisation parameters to the GSP firmware during boot. The rmargs
> structure contains arguments to configure the GSP message/command queue
> location.
>
> These are mapped for coherent DMA and added to the libos data structure
> for access when booting GSP.
>
> Signed-off-by: Alistair Popple <apopple@nvidia.com>
>
> ---
>
> Changes for v2:
> - Rebased on Alex's latest series
> ---
> drivers/gpu/nova-core/gsp.rs | 29 +++++++++++++++-
> drivers/gpu/nova-core/gsp/cmdq.rs | 14 ++++++--
> drivers/gpu/nova-core/gsp/fw.rs | 19 +++++++++++
> .../gpu/nova-core/gsp/fw/r570_144/bindings.rs | 33 +++++++++++++++++++
> 4 files changed, 91 insertions(+), 4 deletions(-)
>
> diff --git a/drivers/gpu/nova-core/gsp.rs b/drivers/gpu/nova-core/gsp.rs
> index 3d4028d67d2e..bb08bd537ec4 100644
> --- a/drivers/gpu/nova-core/gsp.rs
> +++ b/drivers/gpu/nova-core/gsp.rs
> @@ -17,7 +17,10 @@
> use crate::fb::FbLayout;
> use crate::gsp::cmdq::GspCmdq;
>
> -use fw::LibosMemoryRegionInitArgument;
> +use fw::{
> + LibosMemoryRegionInitArgument, GSP_ARGUMENTS_CACHED, GSP_SR_INIT_ARGUMENTS,
> + MESSAGE_QUEUE_INIT_ARGUMENTS,
> +};
>
> pub(crate) mod cmdq;
>
> @@ -33,6 +36,7 @@ pub(crate) struct Gsp {
> pub logintr: CoherentAllocation<u8>,
> pub logrm: CoherentAllocation<u8>,
> pub cmdq: GspCmdq,
> + rmargs: CoherentAllocation<GSP_ARGUMENTS_CACHED>,
> }
>
> /// Creates a self-mapping page table for `obj` at its beginning.
> @@ -90,12 +94,35 @@ pub(crate) fn new(pdev: &pci::Device<device::Bound>) -> Result<impl PinInit<Self
>
> // Creates its own PTE array
> let cmdq = GspCmdq::new(dev)?;
> + let rmargs =
> + create_coherent_dma_object::<GSP_ARGUMENTS_CACHED>(dev, "RMARGS", 1, &mut libos, 3)?;
> + let (shared_mem_phys_addr, cmd_queue_offset, stat_queue_offset) = cmdq.get_cmdq_offsets();
> +
> + dma_write!(
> + rmargs[0].messageQueueInitArguments = MESSAGE_QUEUE_INIT_ARGUMENTS {
> + sharedMemPhysAddr: shared_mem_phys_addr,
> + pageTableEntryCount: cmdq.nr_ptes,
> + cmdQueueOffset: cmd_queue_offset,
> + statQueueOffset: stat_queue_offset,
> + ..Default::default()
> + }
> + )?;
> + dma_write!(
> + rmargs[0].srInitArguments = GSP_SR_INIT_ARGUMENTS {
> + oldLevel: 0,
> + flags: 0,
> + bInPMTransition: 0,
> + ..Default::default()
> + }
> + )?;
> + dma_write!(rmargs[0].bDmemStack = 1)?;
Wrapping our bindings is going to help clean up this code as well.
First, types named in CAPITALS_SNAKE_CASE are not idiomatic Rust and
look like constants. And it's not even like the bindings types are
consistently named that way, since we also have e.g. `GspFwWprMeta` - so
let's give them a proper public name and bring some consistency at the
same time.
This will make all the fields from `GSP_ARGUMENTS_CACHED` invisible to
this module as they should be, so the wrapping `GspArgumentsCached` type
should then have a constructor that receives a referene to the command
queue and takes the information is needs from it, similarly to
`GspFwWprMeta`. This will reduce the 3 `dma_write!` into a single one.
Then we should remove `get_cmdq_offsets`, which is super confusing. I am
also not fond of `cmdq.nr_ptes`. More on them below.
>
> Ok(try_pin_init!(Self {
> libos,
> loginit,
> logintr,
> logrm,
> + rmargs,
> cmdq,
> }))
> }
> diff --git a/drivers/gpu/nova-core/gsp/cmdq.rs b/drivers/gpu/nova-core/gsp/cmdq.rs
> index a9ba1a4c73d8..9170ccf4a064 100644
> --- a/drivers/gpu/nova-core/gsp/cmdq.rs
> +++ b/drivers/gpu/nova-core/gsp/cmdq.rs
> @@ -99,7 +99,6 @@ fn new(dev: &device::Device<device::Bound>) -> Result<Self> {
> Ok(Self(gsp_mem))
> }
>
> - #[expect(unused)]
> fn dma_handle(&self) -> DmaAddress {
> self.0.dma_handle()
> }
> @@ -218,7 +217,7 @@ pub(crate) struct GspCmdq {
> dev: ARef<device::Device>,
> seq: u32,
> gsp_mem: DmaGspMem,
> - pub _nr_ptes: u32,
> + pub nr_ptes: u32,
> }
>
> impl GspCmdq {
> @@ -231,7 +230,7 @@ pub(crate) fn new(dev: &device::Device<device::Bound>) -> Result<GspCmdq> {
> dev: dev.into(),
> seq: 0,
> gsp_mem,
> - _nr_ptes: nr_ptes as u32,
> + nr_ptes: nr_ptes as u32,
> })
> }
>
> @@ -382,6 +381,15 @@ pub(crate) fn receive_msg_from_gsp<M: GspMessageFromGsp, R>(
> .advance_cpu_read_ptr(msg_header.rpc.length.div_ceil(GSP_PAGE_SIZE as u32));
> result
> }
> +
> + pub(crate) fn get_cmdq_offsets(&self) -> (u64, u64, u64) {
> + (
> + self.gsp_mem.dma_handle(),
> + core::mem::offset_of!(Msgq, msgq) as u64,
> + (core::mem::offset_of!(GspMem, gspq) - core::mem::offset_of!(GspMem, cpuq)
> + + core::mem::offset_of!(Msgq, msgq)) as u64,
> + )
> + }
So this thing returns 3 u64s, one of which is actually a DMA handle,
while the two others are technically constants. The only thing that
needs to be inferred at runtime is the DMA handle - all the rest is
static.
So we can make the two last returned values associated constants of
`GspCmdq`:
impl GspCmdq {
/// Offset of the data after the PTEs.
const POST_PTE_OFFSET: usize = core::mem::offset_of!(GspMem, cpuq);
/// Offset of command queue ring buffer.
pub(crate) const CMDQ_OFFSET: usize = core::mem::offset_of!(GspMem, cpuq)
+ core::mem::offset_of!(Msgq, msgq)
- Self::POST_PTE_OFFSET;
/// Offset of message queue ring buffer.
pub(crate) const STATQ_OFFSET: usize = core::mem::offset_of!(GspMem, gspq)
+ core::mem::offset_of!(Msgq, msgq)
- Self::POST_PTE_OFFSET;
`GspArgumentsCached::new` can then import `GspCmdq` and use these to
initialize its corresponding members.
Remains `nr_ptes`. It was introduced in the previous patch as follows:
let nr_ptes = size_of::<GspMem>() >> GSP_PAGE_SHIFT;
Which turns out to also be a constant! So let's add it next to the others:
impl GspCmdq {
...
/// Number of page table entries for the GSP shared region.
pub(crate) const NUM_PTES: usize = size_of::<GspMem>() >> GSP_PAGE_SHIFT;
And you can remove `GspCmdq::nr_ptes` altogether.
With this, `GspArgumentsCached::new` can take a reference to the
`GspCmdq` to initialize from, grab its DMA handle, and initialize
everything else using the constants we defined above. We remove a bunch
of inconsistently-named imports from `gsp.rs`, and replace
firmware-dependent incantations to initialize our GSP arguments with a
single constructor call that tells exactly what it does in a single
line.
On 2025-09-26 at 17:27 +1000, Alexandre Courbot <acourbot@nvidia.com> wrote...
> On Mon Sep 22, 2025 at 8:30 PM JST, Alistair Popple wrote:
> > Initialise the GSP resource manager arguments (rmargs) which provide
> > initialisation parameters to the GSP firmware during boot. The rmargs
> > structure contains arguments to configure the GSP message/command queue
> > location.
> >
> > These are mapped for coherent DMA and added to the libos data structure
> > for access when booting GSP.
> >
> > Signed-off-by: Alistair Popple <apopple@nvidia.com>
> >
> > ---
> >
> > Changes for v2:
> > - Rebased on Alex's latest series
> > ---
> > drivers/gpu/nova-core/gsp.rs | 29 +++++++++++++++-
> > drivers/gpu/nova-core/gsp/cmdq.rs | 14 ++++++--
> > drivers/gpu/nova-core/gsp/fw.rs | 19 +++++++++++
> > .../gpu/nova-core/gsp/fw/r570_144/bindings.rs | 33 +++++++++++++++++++
> > 4 files changed, 91 insertions(+), 4 deletions(-)
> >
> > diff --git a/drivers/gpu/nova-core/gsp.rs b/drivers/gpu/nova-core/gsp.rs
> > index 3d4028d67d2e..bb08bd537ec4 100644
> > --- a/drivers/gpu/nova-core/gsp.rs
> > +++ b/drivers/gpu/nova-core/gsp.rs
> > @@ -17,7 +17,10 @@
> > use crate::fb::FbLayout;
> > use crate::gsp::cmdq::GspCmdq;
> >
> > -use fw::LibosMemoryRegionInitArgument;
> > +use fw::{
> > + LibosMemoryRegionInitArgument, GSP_ARGUMENTS_CACHED, GSP_SR_INIT_ARGUMENTS,
> > + MESSAGE_QUEUE_INIT_ARGUMENTS,
> > +};
> >
> > pub(crate) mod cmdq;
> >
> > @@ -33,6 +36,7 @@ pub(crate) struct Gsp {
> > pub logintr: CoherentAllocation<u8>,
> > pub logrm: CoherentAllocation<u8>,
> > pub cmdq: GspCmdq,
> > + rmargs: CoherentAllocation<GSP_ARGUMENTS_CACHED>,
> > }
> >
> > /// Creates a self-mapping page table for `obj` at its beginning.
> > @@ -90,12 +94,35 @@ pub(crate) fn new(pdev: &pci::Device<device::Bound>) -> Result<impl PinInit<Self
> >
> > // Creates its own PTE array
> > let cmdq = GspCmdq::new(dev)?;
> > + let rmargs =
> > + create_coherent_dma_object::<GSP_ARGUMENTS_CACHED>(dev, "RMARGS", 1, &mut libos, 3)?;
> > + let (shared_mem_phys_addr, cmd_queue_offset, stat_queue_offset) = cmdq.get_cmdq_offsets();
> > +
> > + dma_write!(
> > + rmargs[0].messageQueueInitArguments = MESSAGE_QUEUE_INIT_ARGUMENTS {
> > + sharedMemPhysAddr: shared_mem_phys_addr,
> > + pageTableEntryCount: cmdq.nr_ptes,
> > + cmdQueueOffset: cmd_queue_offset,
> > + statQueueOffset: stat_queue_offset,
> > + ..Default::default()
> > + }
> > + )?;
> > + dma_write!(
> > + rmargs[0].srInitArguments = GSP_SR_INIT_ARGUMENTS {
> > + oldLevel: 0,
> > + flags: 0,
> > + bInPMTransition: 0,
> > + ..Default::default()
> > + }
> > + )?;
> > + dma_write!(rmargs[0].bDmemStack = 1)?;
>
> Wrapping our bindings is going to help clean up this code as well.
>
> First, types named in CAPITALS_SNAKE_CASE are not idiomatic Rust and
> look like constants. And it's not even like the bindings types are
> consistently named that way, since we also have e.g. `GspFwWprMeta` - so
> let's give them a proper public name and bring some consistency at the
> same time.
I think there are two aspects to the bindings - one which was addressed in
the comments for patch 5 is how to abstract them. The other is that the way we
currently generate them results in some ugly name.
Given we want to generate these from our internal IDL eventually I would favour
fixing this naming ugliness by touching up the currently generated bindings. So
maybe I will do that for the next revision.
> This will make all the fields from `GSP_ARGUMENTS_CACHED` invisible to
> this module as they should be, so the wrapping `GspArgumentsCached` type
> should then have a constructor that receives a referene to the command
> queue and takes the information is needs from it, similarly to
> `GspFwWprMeta`. This will reduce the 3 `dma_write!` into a single one.
>
> Then we should remove `get_cmdq_offsets`, which is super confusing. I am
> also not fond of `cmdq.nr_ptes`. More on them below.
I will admit that was a bit of a hack.
> >
> > Ok(try_pin_init!(Self {
> > libos,
> > loginit,
> > logintr,
> > logrm,
> > + rmargs,
> > cmdq,
> > }))
> > }
> > diff --git a/drivers/gpu/nova-core/gsp/cmdq.rs b/drivers/gpu/nova-core/gsp/cmdq.rs
> > index a9ba1a4c73d8..9170ccf4a064 100644
> > --- a/drivers/gpu/nova-core/gsp/cmdq.rs
> > +++ b/drivers/gpu/nova-core/gsp/cmdq.rs
> > @@ -99,7 +99,6 @@ fn new(dev: &device::Device<device::Bound>) -> Result<Self> {
> > Ok(Self(gsp_mem))
> > }
> >
> > - #[expect(unused)]
> > fn dma_handle(&self) -> DmaAddress {
> > self.0.dma_handle()
> > }
> > @@ -218,7 +217,7 @@ pub(crate) struct GspCmdq {
> > dev: ARef<device::Device>,
> > seq: u32,
> > gsp_mem: DmaGspMem,
> > - pub _nr_ptes: u32,
> > + pub nr_ptes: u32,
> > }
> >
> > impl GspCmdq {
> > @@ -231,7 +230,7 @@ pub(crate) fn new(dev: &device::Device<device::Bound>) -> Result<GspCmdq> {
> > dev: dev.into(),
> > seq: 0,
> > gsp_mem,
> > - _nr_ptes: nr_ptes as u32,
> > + nr_ptes: nr_ptes as u32,
> > })
> > }
> >
> > @@ -382,6 +381,15 @@ pub(crate) fn receive_msg_from_gsp<M: GspMessageFromGsp, R>(
> > .advance_cpu_read_ptr(msg_header.rpc.length.div_ceil(GSP_PAGE_SIZE as u32));
> > result
> > }
> > +
> > + pub(crate) fn get_cmdq_offsets(&self) -> (u64, u64, u64) {
> > + (
> > + self.gsp_mem.dma_handle(),
> > + core::mem::offset_of!(Msgq, msgq) as u64,
> > + (core::mem::offset_of!(GspMem, gspq) - core::mem::offset_of!(GspMem, cpuq)
> > + + core::mem::offset_of!(Msgq, msgq)) as u64,
> > + )
> > + }
>
> So this thing returns 3 u64s, one of which is actually a DMA handle,
> while the two others are technically constants. The only thing that
> needs to be inferred at runtime is the DMA handle - all the rest is
> static.
Thanks! That is a useful observation for cleaning these up.
> So we can make the two last returned values associated constants of
> `GspCmdq`:
>
> impl GspCmdq {
> /// Offset of the data after the PTEs.
> const POST_PTE_OFFSET: usize = core::mem::offset_of!(GspMem, cpuq);
>
> /// Offset of command queue ring buffer.
> pub(crate) const CMDQ_OFFSET: usize = core::mem::offset_of!(GspMem, cpuq)
> + core::mem::offset_of!(Msgq, msgq)
> - Self::POST_PTE_OFFSET;
>
> /// Offset of message queue ring buffer.
> pub(crate) const STATQ_OFFSET: usize = core::mem::offset_of!(GspMem, gspq)
> + core::mem::offset_of!(Msgq, msgq)
> - Self::POST_PTE_OFFSET;
>
> `GspArgumentsCached::new` can then import `GspCmdq` and use these to
> initialize its corresponding members.
>
> Remains `nr_ptes`. It was introduced in the previous patch as follows:
>
> let nr_ptes = size_of::<GspMem>() >> GSP_PAGE_SHIFT;
>
> Which turns out to also be a constant! So let's add it next to the others:
>
> impl GspCmdq {
> ...
> /// Number of page table entries for the GSP shared region.
> pub(crate) const NUM_PTES: usize = size_of::<GspMem>() >> GSP_PAGE_SHIFT;
>
> And you can remove `GspCmdq::nr_ptes` altogether.
>
> With this, `GspArgumentsCached::new` can take a reference to the
> `GspCmdq` to initialize from, grab its DMA handle, and initialize
> everything else using the constants we defined above. We remove a bunch
> of inconsistently-named imports from `gsp.rs`, and replace
> firmware-dependent incantations to initialize our GSP arguments with a
> single constructor call that tells exactly what it does in a single
> line.
So this would also live in `fw.rs`? What I'm really concerned about is that if
we're not allowed access the C bindings outside of `fw.rs` then everything ends
up in `fw.rs`, and worse still `fw.rs` basically ends up importing everything as
well, tightly coupling everything into one big blob.
So ugly naming aside, I really can't see the advantage of this. It would seem
much cleaner to have to have gsp.rs import the C bindings it needs and tie that
togeather with the other higher level Gsp abstractions.
Although I agree with the overall sentiment - the code could be better here -
we could still create GspArgumentsCached::new() as you suggest just there's no
reason for it to be in `fw.rs`. The type aliases I had were just to hide the
ugly names really.
On Mon Sep 29, 2025 at 8:36 AM CEST, Alistair Popple wrote:
> On 2025-09-26 at 17:27 +1000, Alexandre Courbot <acourbot@nvidia.com> wrote...
>> On Mon Sep 22, 2025 at 8:30 PM JST, Alistair Popple wrote:
>> > @@ -33,6 +36,7 @@ pub(crate) struct Gsp {
>> > pub logintr: CoherentAllocation<u8>,
>> > pub logrm: CoherentAllocation<u8>,
>> > pub cmdq: GspCmdq,
>> > + rmargs: CoherentAllocation<GSP_ARGUMENTS_CACHED>,
>> > }
>> >
>> > /// Creates a self-mapping page table for `obj` at its beginning.
>> > @@ -90,12 +94,35 @@ pub(crate) fn new(pdev: &pci::Device<device::Bound>) -> Result<impl PinInit<Self
>> >
>> > // Creates its own PTE array
>> > let cmdq = GspCmdq::new(dev)?;
>> > + let rmargs =
>> > + create_coherent_dma_object::<GSP_ARGUMENTS_CACHED>(dev, "RMARGS", 1, &mut libos, 3)?;
>> > + let (shared_mem_phys_addr, cmd_queue_offset, stat_queue_offset) = cmdq.get_cmdq_offsets();
>> > +
>> > + dma_write!(
>> > + rmargs[0].messageQueueInitArguments = MESSAGE_QUEUE_INIT_ARGUMENTS {
>> > + sharedMemPhysAddr: shared_mem_phys_addr,
>> > + pageTableEntryCount: cmdq.nr_ptes,
>> > + cmdQueueOffset: cmd_queue_offset,
>> > + statQueueOffset: stat_queue_offset,
>> > + ..Default::default()
>> > + }
>> > + )?;
>> > + dma_write!(
>> > + rmargs[0].srInitArguments = GSP_SR_INIT_ARGUMENTS {
>> > + oldLevel: 0,
>> > + flags: 0,
>> > + bInPMTransition: 0,
>> > + ..Default::default()
>> > + }
>> > + )?;
>> > + dma_write!(rmargs[0].bDmemStack = 1)?;
>>
>> Wrapping our bindings is going to help clean up this code as well.
>>
>> First, types named in CAPITALS_SNAKE_CASE are not idiomatic Rust and
>> look like constants. And it's not even like the bindings types are
>> consistently named that way, since we also have e.g. `GspFwWprMeta` - so
>> let's give them a proper public name and bring some consistency at the
>> same time.
>
> I think there are two aspects to the bindings - one which was addressed in
> the comments for patch 5 is how to abstract them. The other is that the way we
> currently generate them results in some ugly name.
>
> Given we want to generate these from our internal IDL eventually I would favour
> fixing this naming ugliness by touching up the currently generated bindings. So
> maybe I will do that for the next revision.
It's not about fixing the name of the generated C bindings, it's about not
leaking firmware specific structures into core code of the driver.
Please hide it in an abstraction that can deal with differences between firmware
version internally; see also [1].
[1] https://lore.kernel.org/all/DCUAYNNP97QI.1VOX5XUS9KP7K@kernel.org/
>> This will make all the fields from `GSP_ARGUMENTS_CACHED` invisible to
>> this module as they should be, so the wrapping `GspArgumentsCached` type
>> should then have a constructor that receives a referene to the command
>> queue and takes the information is needs from it, similarly to
>> `GspFwWprMeta`. This will reduce the 3 `dma_write!` into a single one.
>>
>> Then we should remove `get_cmdq_offsets`, which is super confusing. I am
>> also not fond of `cmdq.nr_ptes`. More on them below.
>
> I will admit that was a bit of a hack.
>
>> >
>> > Ok(try_pin_init!(Self {
>> > libos,
>> > loginit,
>> > logintr,
>> > logrm,
>> > + rmargs,
>> > cmdq,
>> > }))
>> > }
>> > diff --git a/drivers/gpu/nova-core/gsp/cmdq.rs b/drivers/gpu/nova-core/gsp/cmdq.rs
>> > index a9ba1a4c73d8..9170ccf4a064 100644
>> > --- a/drivers/gpu/nova-core/gsp/cmdq.rs
>> > +++ b/drivers/gpu/nova-core/gsp/cmdq.rs
>> > @@ -99,7 +99,6 @@ fn new(dev: &device::Device<device::Bound>) -> Result<Self> {
>> > Ok(Self(gsp_mem))
>> > }
>> >
>> > - #[expect(unused)]
>> > fn dma_handle(&self) -> DmaAddress {
>> > self.0.dma_handle()
>> > }
>> > @@ -218,7 +217,7 @@ pub(crate) struct GspCmdq {
>> > dev: ARef<device::Device>,
>> > seq: u32,
>> > gsp_mem: DmaGspMem,
>> > - pub _nr_ptes: u32,
>> > + pub nr_ptes: u32,
>> > }
>> >
>> > impl GspCmdq {
>> > @@ -231,7 +230,7 @@ pub(crate) fn new(dev: &device::Device<device::Bound>) -> Result<GspCmdq> {
>> > dev: dev.into(),
>> > seq: 0,
>> > gsp_mem,
>> > - _nr_ptes: nr_ptes as u32,
>> > + nr_ptes: nr_ptes as u32,
>> > })
>> > }
>> >
>> > @@ -382,6 +381,15 @@ pub(crate) fn receive_msg_from_gsp<M: GspMessageFromGsp, R>(
>> > .advance_cpu_read_ptr(msg_header.rpc.length.div_ceil(GSP_PAGE_SIZE as u32));
>> > result
>> > }
>> > +
>> > + pub(crate) fn get_cmdq_offsets(&self) -> (u64, u64, u64) {
>> > + (
>> > + self.gsp_mem.dma_handle(),
>> > + core::mem::offset_of!(Msgq, msgq) as u64,
>> > + (core::mem::offset_of!(GspMem, gspq) - core::mem::offset_of!(GspMem, cpuq)
>> > + + core::mem::offset_of!(Msgq, msgq)) as u64,
>> > + )
>> > + }
>>
>> So this thing returns 3 u64s, one of which is actually a DMA handle,
>> while the two others are technically constants. The only thing that
>> needs to be inferred at runtime is the DMA handle - all the rest is
>> static.
>
> Thanks! That is a useful observation for cleaning these up.
Please also make sure to use the DmaAddress type instead of a raw u64 for DMA
addresses.
>> So we can make the two last returned values associated constants of
>> `GspCmdq`:
>>
>> impl GspCmdq {
>> /// Offset of the data after the PTEs.
>> const POST_PTE_OFFSET: usize = core::mem::offset_of!(GspMem, cpuq);
>>
>> /// Offset of command queue ring buffer.
>> pub(crate) const CMDQ_OFFSET: usize = core::mem::offset_of!(GspMem, cpuq)
>> + core::mem::offset_of!(Msgq, msgq)
>> - Self::POST_PTE_OFFSET;
>>
>> /// Offset of message queue ring buffer.
>> pub(crate) const STATQ_OFFSET: usize = core::mem::offset_of!(GspMem, gspq)
>> + core::mem::offset_of!(Msgq, msgq)
>> - Self::POST_PTE_OFFSET;
>>
>> `GspArgumentsCached::new` can then import `GspCmdq` and use these to
>> initialize its corresponding members.
>>
>> Remains `nr_ptes`. It was introduced in the previous patch as follows:
>>
>> let nr_ptes = size_of::<GspMem>() >> GSP_PAGE_SHIFT;
>>
>> Which turns out to also be a constant! So let's add it next to the others:
>>
>> impl GspCmdq {
>> ...
>> /// Number of page table entries for the GSP shared region.
>> pub(crate) const NUM_PTES: usize = size_of::<GspMem>() >> GSP_PAGE_SHIFT;
>>
>> And you can remove `GspCmdq::nr_ptes` altogether.
>>
>> With this, `GspArgumentsCached::new` can take a reference to the
>> `GspCmdq` to initialize from, grab its DMA handle, and initialize
>> everything else using the constants we defined above. We remove a bunch
>> of inconsistently-named imports from `gsp.rs`, and replace
>> firmware-dependent incantations to initialize our GSP arguments with a
>> single constructor call that tells exactly what it does in a single
>> line.
>
> So this would also live in `fw.rs`? What I'm really concerned about is that if
> we're not allowed access the C bindings outside of `fw.rs` then everything ends
> up in `fw.rs`, and worse still `fw.rs` basically ends up importing everything as
> well, tightly coupling everything into one big blob.
You can (and probably should) extend the module structure, i.e. add a
sub-directory ./gsp/fw/ and structure things accordingly.
On 2025-09-29 at 17:18 +1000, Danilo Krummrich <dakr@kernel.org> wrote...
> On Mon Sep 29, 2025 at 8:36 AM CEST, Alistair Popple wrote:
> > On 2025-09-26 at 17:27 +1000, Alexandre Courbot <acourbot@nvidia.com> wrote...
> >> On Mon Sep 22, 2025 at 8:30 PM JST, Alistair Popple wrote:
> >> > @@ -33,6 +36,7 @@ pub(crate) struct Gsp {
> >> > pub logintr: CoherentAllocation<u8>,
> >> > pub logrm: CoherentAllocation<u8>,
> >> > pub cmdq: GspCmdq,
> >> > + rmargs: CoherentAllocation<GSP_ARGUMENTS_CACHED>,
> >> > }
> >> >
> >> > /// Creates a self-mapping page table for `obj` at its beginning.
> >> > @@ -90,12 +94,35 @@ pub(crate) fn new(pdev: &pci::Device<device::Bound>) -> Result<impl PinInit<Self
> >> >
> >> > // Creates its own PTE array
> >> > let cmdq = GspCmdq::new(dev)?;
> >> > + let rmargs =
> >> > + create_coherent_dma_object::<GSP_ARGUMENTS_CACHED>(dev, "RMARGS", 1, &mut libos, 3)?;
> >> > + let (shared_mem_phys_addr, cmd_queue_offset, stat_queue_offset) = cmdq.get_cmdq_offsets();
> >> > +
> >> > + dma_write!(
> >> > + rmargs[0].messageQueueInitArguments = MESSAGE_QUEUE_INIT_ARGUMENTS {
> >> > + sharedMemPhysAddr: shared_mem_phys_addr,
> >> > + pageTableEntryCount: cmdq.nr_ptes,
> >> > + cmdQueueOffset: cmd_queue_offset,
> >> > + statQueueOffset: stat_queue_offset,
> >> > + ..Default::default()
> >> > + }
> >> > + )?;
> >> > + dma_write!(
> >> > + rmargs[0].srInitArguments = GSP_SR_INIT_ARGUMENTS {
> >> > + oldLevel: 0,
> >> > + flags: 0,
> >> > + bInPMTransition: 0,
> >> > + ..Default::default()
> >> > + }
> >> > + )?;
> >> > + dma_write!(rmargs[0].bDmemStack = 1)?;
> >>
> >> Wrapping our bindings is going to help clean up this code as well.
> >>
> >> First, types named in CAPITALS_SNAKE_CASE are not idiomatic Rust and
> >> look like constants. And it's not even like the bindings types are
> >> consistently named that way, since we also have e.g. `GspFwWprMeta` - so
> >> let's give them a proper public name and bring some consistency at the
> >> same time.
> >
> > I think there are two aspects to the bindings - one which was addressed in
> > the comments for patch 5 is how to abstract them. The other is that the way we
> > currently generate them results in some ugly name.
> >
> > Given we want to generate these from our internal IDL eventually I would favour
> > fixing this naming ugliness by touching up the currently generated bindings. So
> > maybe I will do that for the next revision.
>
> It's not about fixing the name of the generated C bindings, it's about not
> leaking firmware specific structures into core code of the driver.
I don't disagree. Please see my comments on patch 5, which deals more with the
type of abstraction we want to provide.
> Please hide it in an abstraction that can deal with differences between firmware
> version internally; see also [1].
>
> [1] https://lore.kernel.org/all/DCUAYNNP97QI.1VOX5XUS9KP7K@kernel.org/
>
> >> This will make all the fields from `GSP_ARGUMENTS_CACHED` invisible to
> >> this module as they should be, so the wrapping `GspArgumentsCached` type
> >> should then have a constructor that receives a referene to the command
> >> queue and takes the information is needs from it, similarly to
> >> `GspFwWprMeta`. This will reduce the 3 `dma_write!` into a single one.
> >>
> >> Then we should remove `get_cmdq_offsets`, which is super confusing. I am
> >> also not fond of `cmdq.nr_ptes`. More on them below.
> >
> > I will admit that was a bit of a hack.
> >
> >> >
> >> > Ok(try_pin_init!(Self {
> >> > libos,
> >> > loginit,
> >> > logintr,
> >> > logrm,
> >> > + rmargs,
> >> > cmdq,
> >> > }))
> >> > }
> >> > diff --git a/drivers/gpu/nova-core/gsp/cmdq.rs b/drivers/gpu/nova-core/gsp/cmdq.rs
> >> > index a9ba1a4c73d8..9170ccf4a064 100644
> >> > --- a/drivers/gpu/nova-core/gsp/cmdq.rs
> >> > +++ b/drivers/gpu/nova-core/gsp/cmdq.rs
> >> > @@ -99,7 +99,6 @@ fn new(dev: &device::Device<device::Bound>) -> Result<Self> {
> >> > Ok(Self(gsp_mem))
> >> > }
> >> >
> >> > - #[expect(unused)]
> >> > fn dma_handle(&self) -> DmaAddress {
> >> > self.0.dma_handle()
> >> > }
> >> > @@ -218,7 +217,7 @@ pub(crate) struct GspCmdq {
> >> > dev: ARef<device::Device>,
> >> > seq: u32,
> >> > gsp_mem: DmaGspMem,
> >> > - pub _nr_ptes: u32,
> >> > + pub nr_ptes: u32,
> >> > }
> >> >
> >> > impl GspCmdq {
> >> > @@ -231,7 +230,7 @@ pub(crate) fn new(dev: &device::Device<device::Bound>) -> Result<GspCmdq> {
> >> > dev: dev.into(),
> >> > seq: 0,
> >> > gsp_mem,
> >> > - _nr_ptes: nr_ptes as u32,
> >> > + nr_ptes: nr_ptes as u32,
> >> > })
> >> > }
> >> >
> >> > @@ -382,6 +381,15 @@ pub(crate) fn receive_msg_from_gsp<M: GspMessageFromGsp, R>(
> >> > .advance_cpu_read_ptr(msg_header.rpc.length.div_ceil(GSP_PAGE_SIZE as u32));
> >> > result
> >> > }
> >> > +
> >> > + pub(crate) fn get_cmdq_offsets(&self) -> (u64, u64, u64) {
> >> > + (
> >> > + self.gsp_mem.dma_handle(),
> >> > + core::mem::offset_of!(Msgq, msgq) as u64,
> >> > + (core::mem::offset_of!(GspMem, gspq) - core::mem::offset_of!(GspMem, cpuq)
> >> > + + core::mem::offset_of!(Msgq, msgq)) as u64,
> >> > + )
> >> > + }
> >>
> >> So this thing returns 3 u64s, one of which is actually a DMA handle,
> >> while the two others are technically constants. The only thing that
> >> needs to be inferred at runtime is the DMA handle - all the rest is
> >> static.
> >
> > Thanks! That is a useful observation for cleaning these up.
>
> Please also make sure to use the DmaAddress type instead of a raw u64 for DMA
> addresses.
>
> >> So we can make the two last returned values associated constants of
> >> `GspCmdq`:
> >>
> >> impl GspCmdq {
> >> /// Offset of the data after the PTEs.
> >> const POST_PTE_OFFSET: usize = core::mem::offset_of!(GspMem, cpuq);
> >>
> >> /// Offset of command queue ring buffer.
> >> pub(crate) const CMDQ_OFFSET: usize = core::mem::offset_of!(GspMem, cpuq)
> >> + core::mem::offset_of!(Msgq, msgq)
> >> - Self::POST_PTE_OFFSET;
> >>
> >> /// Offset of message queue ring buffer.
> >> pub(crate) const STATQ_OFFSET: usize = core::mem::offset_of!(GspMem, gspq)
> >> + core::mem::offset_of!(Msgq, msgq)
> >> - Self::POST_PTE_OFFSET;
> >>
> >> `GspArgumentsCached::new` can then import `GspCmdq` and use these to
> >> initialize its corresponding members.
> >>
> >> Remains `nr_ptes`. It was introduced in the previous patch as follows:
> >>
> >> let nr_ptes = size_of::<GspMem>() >> GSP_PAGE_SHIFT;
> >>
> >> Which turns out to also be a constant! So let's add it next to the others:
> >>
> >> impl GspCmdq {
> >> ...
> >> /// Number of page table entries for the GSP shared region.
> >> pub(crate) const NUM_PTES: usize = size_of::<GspMem>() >> GSP_PAGE_SHIFT;
> >>
> >> And you can remove `GspCmdq::nr_ptes` altogether.
> >>
> >> With this, `GspArgumentsCached::new` can take a reference to the
> >> `GspCmdq` to initialize from, grab its DMA handle, and initialize
> >> everything else using the constants we defined above. We remove a bunch
> >> of inconsistently-named imports from `gsp.rs`, and replace
> >> firmware-dependent incantations to initialize our GSP arguments with a
> >> single constructor call that tells exactly what it does in a single
> >> line.
> >
> > So this would also live in `fw.rs`? What I'm really concerned about is that if
> > we're not allowed access the C bindings outside of `fw.rs` then everything ends
> > up in `fw.rs`, and worse still `fw.rs` basically ends up importing everything as
> > well, tightly coupling everything into one big blob.
>
> You can (and probably should) extend the module structure, i.e. add a
> sub-directory ./gsp/fw/ and structure things accordingly.
This is what I thought the gsp directory was for, providing abstractions for the
Gsp. IMHO another layer of abstraction below this seems unnecessary, although
this is discussed in a bit more detail at the end of my comments on patch 5.
© 2016 - 2026 Red Hat, Inc.