mirror of https://github.com/torvalds/linux.git
313 lines
8.7 KiB
Rust
313 lines
8.7 KiB
Rust
// SPDX-License-Identifier: GPL-2.0
|
|
|
|
use kernel::{device, devres::Devres, error::code::*, pci, prelude::*, sync::Arc};
|
|
|
|
use crate::driver::Bar0;
|
|
use crate::falcon::{gsp::Gsp, sec2::Sec2, Falcon};
|
|
use crate::fb::FbLayout;
|
|
use crate::fb::SysmemFlush;
|
|
use crate::firmware::fwsec::{FwsecCommand, FwsecFirmware};
|
|
use crate::firmware::{Firmware, FIRMWARE_VERSION};
|
|
use crate::gfw;
|
|
use crate::regs;
|
|
use crate::util;
|
|
use crate::vbios::Vbios;
|
|
use core::fmt;
|
|
|
|
macro_rules! define_chipset {
|
|
({ $($variant:ident = $value:expr),* $(,)* }) =>
|
|
{
|
|
/// Enum representation of the GPU chipset.
|
|
#[derive(fmt::Debug, Copy, Clone, PartialOrd, Ord, PartialEq, Eq)]
|
|
pub(crate) enum Chipset {
|
|
$($variant = $value),*,
|
|
}
|
|
|
|
impl Chipset {
|
|
pub(crate) const ALL: &'static [Chipset] = &[
|
|
$( Chipset::$variant, )*
|
|
];
|
|
|
|
pub(crate) const NAMES: [&'static str; Self::ALL.len()] = [
|
|
$( util::const_bytes_to_str(
|
|
util::to_lowercase_bytes::<{ stringify!($variant).len() }>(
|
|
stringify!($variant)
|
|
).as_slice()
|
|
), )*
|
|
];
|
|
}
|
|
|
|
// TODO[FPRI]: replace with something like derive(FromPrimitive)
|
|
impl TryFrom<u32> for Chipset {
|
|
type Error = kernel::error::Error;
|
|
|
|
fn try_from(value: u32) -> Result<Self, Self::Error> {
|
|
match value {
|
|
$( $value => Ok(Chipset::$variant), )*
|
|
_ => Err(ENODEV),
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
define_chipset!({
|
|
// Turing
|
|
TU102 = 0x162,
|
|
TU104 = 0x164,
|
|
TU106 = 0x166,
|
|
TU117 = 0x167,
|
|
TU116 = 0x168,
|
|
// Ampere
|
|
GA100 = 0x170,
|
|
GA102 = 0x172,
|
|
GA103 = 0x173,
|
|
GA104 = 0x174,
|
|
GA106 = 0x176,
|
|
GA107 = 0x177,
|
|
// Ada
|
|
AD102 = 0x192,
|
|
AD103 = 0x193,
|
|
AD104 = 0x194,
|
|
AD106 = 0x196,
|
|
AD107 = 0x197,
|
|
});
|
|
|
|
impl Chipset {
|
|
pub(crate) fn arch(&self) -> Architecture {
|
|
match self {
|
|
Self::TU102 | Self::TU104 | Self::TU106 | Self::TU117 | Self::TU116 => {
|
|
Architecture::Turing
|
|
}
|
|
Self::GA100 | Self::GA102 | Self::GA103 | Self::GA104 | Self::GA106 | Self::GA107 => {
|
|
Architecture::Ampere
|
|
}
|
|
Self::AD102 | Self::AD103 | Self::AD104 | Self::AD106 | Self::AD107 => {
|
|
Architecture::Ada
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
// TODO
|
|
//
|
|
// The resulting strings are used to generate firmware paths, hence the
|
|
// generated strings have to be stable.
|
|
//
|
|
// Hence, replace with something like strum_macros derive(Display).
|
|
//
|
|
// For now, redirect to fmt::Debug for convenience.
|
|
impl fmt::Display for Chipset {
|
|
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
|
|
write!(f, "{self:?}")
|
|
}
|
|
}
|
|
|
|
/// Enum representation of the GPU generation.
|
|
#[derive(fmt::Debug)]
|
|
pub(crate) enum Architecture {
|
|
Turing = 0x16,
|
|
Ampere = 0x17,
|
|
Ada = 0x19,
|
|
}
|
|
|
|
impl TryFrom<u8> for Architecture {
|
|
type Error = Error;
|
|
|
|
fn try_from(value: u8) -> Result<Self> {
|
|
match value {
|
|
0x16 => Ok(Self::Turing),
|
|
0x17 => Ok(Self::Ampere),
|
|
0x19 => Ok(Self::Ada),
|
|
_ => Err(ENODEV),
|
|
}
|
|
}
|
|
}
|
|
|
|
pub(crate) struct Revision {
|
|
major: u8,
|
|
minor: u8,
|
|
}
|
|
|
|
impl Revision {
|
|
fn from_boot0(boot0: regs::NV_PMC_BOOT_0) -> Self {
|
|
Self {
|
|
major: boot0.major_revision(),
|
|
minor: boot0.minor_revision(),
|
|
}
|
|
}
|
|
}
|
|
|
|
impl fmt::Display for Revision {
|
|
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
|
|
write!(f, "{:x}.{:x}", self.major, self.minor)
|
|
}
|
|
}
|
|
|
|
/// Structure holding the metadata of the GPU.
|
|
pub(crate) struct Spec {
|
|
chipset: Chipset,
|
|
/// The revision of the chipset.
|
|
revision: Revision,
|
|
}
|
|
|
|
impl Spec {
|
|
fn new(bar: &Bar0) -> Result<Spec> {
|
|
let boot0 = regs::NV_PMC_BOOT_0::read(bar);
|
|
|
|
Ok(Self {
|
|
chipset: boot0.chipset()?,
|
|
revision: Revision::from_boot0(boot0),
|
|
})
|
|
}
|
|
}
|
|
|
|
/// Structure holding the resources required to operate the GPU.
|
|
#[pin_data(PinnedDrop)]
|
|
pub(crate) struct Gpu {
|
|
spec: Spec,
|
|
/// MMIO mapping of PCI BAR 0
|
|
bar: Arc<Devres<Bar0>>,
|
|
fw: Firmware,
|
|
/// System memory page required for flushing all pending GPU-side memory writes done through
|
|
/// PCIE into system memory, via sysmembar (A GPU-initiated HW memory-barrier operation).
|
|
sysmem_flush: SysmemFlush,
|
|
}
|
|
|
|
#[pinned_drop]
|
|
impl PinnedDrop for Gpu {
|
|
fn drop(self: Pin<&mut Self>) {
|
|
// Unregister the sysmem flush page before we release it.
|
|
self.bar
|
|
.try_access_with(|b| self.sysmem_flush.unregister(b));
|
|
}
|
|
}
|
|
|
|
impl Gpu {
|
|
/// Helper function to load and run the FWSEC-FRTS firmware and confirm that it has properly
|
|
/// created the WPR2 region.
|
|
///
|
|
/// TODO: this needs to be moved into a larger type responsible for booting the whole GSP
|
|
/// (`GspBooter`?).
|
|
fn run_fwsec_frts(
|
|
dev: &device::Device<device::Bound>,
|
|
falcon: &Falcon<Gsp>,
|
|
bar: &Bar0,
|
|
bios: &Vbios,
|
|
fb_layout: &FbLayout,
|
|
) -> Result<()> {
|
|
// Check that the WPR2 region does not already exists - if it does, we cannot run
|
|
// FWSEC-FRTS until the GPU is reset.
|
|
if regs::NV_PFB_PRI_MMU_WPR2_ADDR_HI::read(bar).higher_bound() != 0 {
|
|
dev_err!(
|
|
dev,
|
|
"WPR2 region already exists - GPU needs to be reset to proceed\n"
|
|
);
|
|
return Err(EBUSY);
|
|
}
|
|
|
|
let fwsec_frts = FwsecFirmware::new(
|
|
dev,
|
|
falcon,
|
|
bar,
|
|
bios,
|
|
FwsecCommand::Frts {
|
|
frts_addr: fb_layout.frts.start,
|
|
frts_size: fb_layout.frts.end - fb_layout.frts.start,
|
|
},
|
|
)?;
|
|
|
|
// Run FWSEC-FRTS to create the WPR2 region.
|
|
fwsec_frts.run(dev, falcon, bar)?;
|
|
|
|
// SCRATCH_E contains the error code for FWSEC-FRTS.
|
|
let frts_status = regs::NV_PBUS_SW_SCRATCH_0E::read(bar).frts_err_code();
|
|
if frts_status != 0 {
|
|
dev_err!(
|
|
dev,
|
|
"FWSEC-FRTS returned with error code {:#x}",
|
|
frts_status
|
|
);
|
|
|
|
return Err(EIO);
|
|
}
|
|
|
|
// Check that the WPR2 region has been created as we requested.
|
|
let (wpr2_lo, wpr2_hi) = (
|
|
regs::NV_PFB_PRI_MMU_WPR2_ADDR_LO::read(bar).lower_bound(),
|
|
regs::NV_PFB_PRI_MMU_WPR2_ADDR_HI::read(bar).higher_bound(),
|
|
);
|
|
|
|
match (wpr2_lo, wpr2_hi) {
|
|
(_, 0) => {
|
|
dev_err!(dev, "WPR2 region not created after running FWSEC-FRTS\n");
|
|
|
|
Err(EIO)
|
|
}
|
|
(wpr2_lo, _) if wpr2_lo != fb_layout.frts.start => {
|
|
dev_err!(
|
|
dev,
|
|
"WPR2 region created at unexpected address {:#x}; expected {:#x}\n",
|
|
wpr2_lo,
|
|
fb_layout.frts.start,
|
|
);
|
|
|
|
Err(EIO)
|
|
}
|
|
(wpr2_lo, wpr2_hi) => {
|
|
dev_dbg!(dev, "WPR2: {:#x}-{:#x}\n", wpr2_lo, wpr2_hi);
|
|
dev_dbg!(dev, "GPU instance built\n");
|
|
|
|
Ok(())
|
|
}
|
|
}
|
|
}
|
|
|
|
pub(crate) fn new(
|
|
pdev: &pci::Device<device::Bound>,
|
|
devres_bar: Arc<Devres<Bar0>>,
|
|
) -> Result<impl PinInit<Self>> {
|
|
let bar = devres_bar.access(pdev.as_ref())?;
|
|
let spec = Spec::new(bar)?;
|
|
let fw = Firmware::new(pdev.as_ref(), spec.chipset, FIRMWARE_VERSION)?;
|
|
|
|
dev_info!(
|
|
pdev.as_ref(),
|
|
"NVIDIA (Chipset: {}, Architecture: {:?}, Revision: {})\n",
|
|
spec.chipset,
|
|
spec.chipset.arch(),
|
|
spec.revision
|
|
);
|
|
|
|
// We must wait for GFW_BOOT completion before doing any significant setup on the GPU.
|
|
gfw::wait_gfw_boot_completion(bar)
|
|
.inspect_err(|_| dev_err!(pdev.as_ref(), "GFW boot did not complete"))?;
|
|
|
|
let sysmem_flush = SysmemFlush::register(pdev.as_ref(), bar, spec.chipset)?;
|
|
|
|
let gsp_falcon = Falcon::<Gsp>::new(
|
|
pdev.as_ref(),
|
|
spec.chipset,
|
|
bar,
|
|
spec.chipset > Chipset::GA100,
|
|
)?;
|
|
gsp_falcon.clear_swgen0_intr(bar);
|
|
|
|
let _sec2_falcon = Falcon::<Sec2>::new(pdev.as_ref(), spec.chipset, bar, true)?;
|
|
|
|
let fb_layout = FbLayout::new(spec.chipset, bar)?;
|
|
dev_dbg!(pdev.as_ref(), "{:#x?}\n", fb_layout);
|
|
|
|
let bios = Vbios::new(pdev, bar)?;
|
|
|
|
Self::run_fwsec_frts(pdev.as_ref(), &gsp_falcon, bar, &bios, &fb_layout)?;
|
|
|
|
Ok(pin_init!(Self {
|
|
spec,
|
|
bar: devres_bar,
|
|
fw,
|
|
sysmem_flush,
|
|
}))
|
|
}
|
|
}
|