mirror of
https://github.com/torvalds/linux.git
synced 2026-04-18 06:44:00 -04:00
Up until now, only the GSP required parsing of its firmware headers. However, upcoming support for Hopper/Blackwell+ adds another firmware image (FMC), along with another format (ELF32). Therefore, the current ELF64 section parsing support needs to be moved up a level, so that both of the above can use it. There are no functional changes. This is pure code movement. Reviewed-by: Gary Guo <gary@garyguo.net> Signed-off-by: John Hubbard <jhubbard@nvidia.com> Acked-by: Danilo Krummrich <dakr@kernel.org> Link: https://patch.msgid.link/20260326013902.588242-8-jhubbard@nvidia.com [acourbot: use fuller prefix in commit message.] Signed-off-by: Alexandre Courbot <acourbot@nvidia.com>
185 lines
6.9 KiB
Rust
185 lines
6.9 KiB
Rust
// SPDX-License-Identifier: GPL-2.0
|
|
|
|
use kernel::{
|
|
device,
|
|
dma::{
|
|
Coherent,
|
|
CoherentBox,
|
|
DataDirection,
|
|
DmaAddress, //
|
|
},
|
|
prelude::*,
|
|
scatterlist::{
|
|
Owned,
|
|
SGTable, //
|
|
},
|
|
};
|
|
|
|
use crate::{
|
|
firmware::{
|
|
elf,
|
|
riscv::RiscvFirmware, //
|
|
},
|
|
gpu::{
|
|
Architecture,
|
|
Chipset, //
|
|
},
|
|
gsp::GSP_PAGE_SIZE,
|
|
num::FromSafeCast,
|
|
};
|
|
|
|
/// GSP firmware with 3-level radix page tables for the GSP bootloader.
|
|
///
|
|
/// The bootloader expects firmware to be mapped starting at address 0 in GSP's virtual address
|
|
/// space:
|
|
///
|
|
/// ```text
|
|
/// Level 0: 1 page, 1 entry -> points to first level 1 page
|
|
/// Level 1: Multiple pages/entries -> each entry points to a level 2 page
|
|
/// Level 2: Multiple pages/entries -> each entry points to a firmware page
|
|
/// ```
|
|
///
|
|
/// Each page is 4KB, each entry is 8 bytes (64-bit DMA address).
|
|
/// Also known as "Radix3" firmware.
|
|
#[pin_data]
|
|
pub(crate) struct GspFirmware {
|
|
/// The GSP firmware inside a [`VVec`], device-mapped via a SG table.
|
|
#[pin]
|
|
fw: SGTable<Owned<VVec<u8>>>,
|
|
/// Level 2 page table whose entries contain DMA addresses of firmware pages.
|
|
#[pin]
|
|
level2: SGTable<Owned<VVec<u8>>>,
|
|
/// Level 1 page table whose entries contain DMA addresses of level 2 pages.
|
|
#[pin]
|
|
level1: SGTable<Owned<VVec<u8>>>,
|
|
/// Level 0 page table (single 4KB page) with one entry: DMA address of first level 1 page.
|
|
level0: Coherent<[u64]>,
|
|
/// Size in bytes of the firmware contained in [`Self::fw`].
|
|
pub(crate) size: usize,
|
|
/// Device-mapped GSP signatures matching the GPU's [`Chipset`].
|
|
pub(crate) signatures: Coherent<[u8]>,
|
|
/// GSP bootloader, verifies the GSP firmware before loading and running it.
|
|
pub(crate) bootloader: RiscvFirmware,
|
|
}
|
|
|
|
impl GspFirmware {
|
|
/// Loads the GSP firmware binaries, map them into `dev`'s address-space, and creates the page
|
|
/// tables expected by the GSP bootloader to load it.
|
|
pub(crate) fn new<'a>(
|
|
dev: &'a device::Device<device::Bound>,
|
|
chipset: Chipset,
|
|
ver: &'a str,
|
|
) -> impl PinInit<Self, Error> + 'a {
|
|
pin_init::pin_init_scope(move || {
|
|
let firmware = super::request_firmware(dev, chipset, "gsp", ver)?;
|
|
|
|
let fw_section = elf::elf64_section(firmware.data(), ".fwimage").ok_or(EINVAL)?;
|
|
|
|
let size = fw_section.len();
|
|
|
|
// Move the firmware into a vmalloc'd vector and map it into the device address
|
|
// space.
|
|
let fw_vvec = VVec::with_capacity(fw_section.len(), GFP_KERNEL)
|
|
.and_then(|mut v| {
|
|
v.extend_from_slice(fw_section, GFP_KERNEL)?;
|
|
Ok(v)
|
|
})
|
|
.map_err(|_| ENOMEM)?;
|
|
|
|
Ok(try_pin_init!(Self {
|
|
fw <- SGTable::new(dev, fw_vvec, DataDirection::ToDevice, GFP_KERNEL),
|
|
level2 <- {
|
|
// Allocate the level 2 page table, map the firmware onto it, and map it into
|
|
// the device address space.
|
|
VVec::<u8>::with_capacity(
|
|
fw.iter().count() * core::mem::size_of::<u64>(),
|
|
GFP_KERNEL,
|
|
)
|
|
.map_err(|_| ENOMEM)
|
|
.and_then(|level2| map_into_lvl(&fw, level2))
|
|
.map(|level2| SGTable::new(dev, level2, DataDirection::ToDevice, GFP_KERNEL))?
|
|
},
|
|
level1 <- {
|
|
// Allocate the level 1 page table, map the level 2 page table onto it, and map
|
|
// it into the device address space.
|
|
VVec::<u8>::with_capacity(
|
|
level2.iter().count() * core::mem::size_of::<u64>(),
|
|
GFP_KERNEL,
|
|
)
|
|
.map_err(|_| ENOMEM)
|
|
.and_then(|level1| map_into_lvl(&level2, level1))
|
|
.map(|level1| SGTable::new(dev, level1, DataDirection::ToDevice, GFP_KERNEL))?
|
|
},
|
|
level0: {
|
|
// Allocate the level 0 page table as a device-visible DMA object, and map the
|
|
// level 1 page table onto it.
|
|
|
|
// Fill level 1 page entry.
|
|
let level1_entry = level1.iter().next().ok_or(EINVAL)?;
|
|
let level1_entry_addr = level1_entry.dma_address();
|
|
|
|
// Create level 0 page table data and fill its first entry with the level 1
|
|
// table.
|
|
let mut level0 = CoherentBox::<[u64]>::zeroed_slice(
|
|
dev,
|
|
GSP_PAGE_SIZE / size_of::<u64>(),
|
|
GFP_KERNEL
|
|
)?;
|
|
level0[0] = level1_entry_addr.to_le();
|
|
|
|
level0.into()
|
|
},
|
|
size,
|
|
signatures: {
|
|
let sigs_section = match chipset.arch() {
|
|
Architecture::Turing
|
|
if matches!(chipset, Chipset::TU116 | Chipset::TU117) =>
|
|
{
|
|
".fwsignature_tu11x"
|
|
}
|
|
Architecture::Turing => ".fwsignature_tu10x",
|
|
// GA100 uses the same firmware as Turing
|
|
Architecture::Ampere if chipset == Chipset::GA100 => ".fwsignature_tu10x",
|
|
Architecture::Ampere => ".fwsignature_ga10x",
|
|
Architecture::Ada => ".fwsignature_ad10x",
|
|
};
|
|
|
|
elf::elf64_section(firmware.data(), sigs_section)
|
|
.ok_or(EINVAL)
|
|
.and_then(|data| Coherent::from_slice(dev, data, GFP_KERNEL))?
|
|
},
|
|
bootloader: {
|
|
let bl = super::request_firmware(dev, chipset, "bootloader", ver)?;
|
|
|
|
RiscvFirmware::new(dev, &bl)?
|
|
},
|
|
}))
|
|
})
|
|
}
|
|
|
|
/// Returns the DMA handle of the radix3 level 0 page table.
|
|
pub(crate) fn radix3_dma_handle(&self) -> DmaAddress {
|
|
self.level0.dma_handle()
|
|
}
|
|
}
|
|
|
|
/// Build a page table from a scatter-gather list.
|
|
///
|
|
/// Takes each DMA-mapped region from `sg_table` and writes page table entries
|
|
/// for all 4KB pages within that region. For example, a 16KB SG entry becomes
|
|
/// 4 consecutive page table entries.
|
|
fn map_into_lvl(sg_table: &SGTable<Owned<VVec<u8>>>, mut dst: VVec<u8>) -> Result<VVec<u8>> {
|
|
for sg_entry in sg_table.iter() {
|
|
// Number of pages we need to map.
|
|
let num_pages = usize::from_safe_cast(sg_entry.dma_len()).div_ceil(GSP_PAGE_SIZE);
|
|
|
|
for i in 0..num_pages {
|
|
let entry = sg_entry.dma_address()
|
|
+ (u64::from_safe_cast(i) * u64::from_safe_cast(GSP_PAGE_SIZE));
|
|
dst.extend_from_slice(&entry.to_le_bytes(), GFP_KERNEL)?;
|
|
}
|
|
}
|
|
|
|
Ok(dst)
|
|
}
|