burn_mamba::mamba3::double_ssd::ssd::ssd_path

Struct Mamba3DoubleSsdInput

pub struct Mamba3DoubleSsdInput {
    pub v_bnlmhp: Tensor<6>,
    pub da_bnlh: Tensor<4>,
    pub b_bnlmhr: Tensor<6>,
    pub c_bnlmhr: Tensor<6>,
    pub initial_state_bhpr: Tensor<4>,
    pub init_state_hpr: Option<Tensor<3>>,
}

Expand description

MIMO-first SSD input.

All tensors are pre-processed: B/C are already QK-normed, RoPE-applied, bias-added, and expanded to per-head (not per-group). V is already scaled by the (double-ssd) trapezoidal coefficient (γ or β). The combined log-decay da = Δ·A is pre-computed. D skip is handled by the caller.

Fields§

§v_bnlmhp: Tensor<6>

Value tensor, already scaled by (double-ssd) trapezoidal coefficient (γ or β).

§Shape

[batch, nchunks, chunk_len, mimo_rank, nheads, per_head_dim]

§da_bnlh: Tensor<4>

Pre-combined log-decay Δ·A (negative).

§Shape

[batch, nchunks, chunk_len, nheads]

§b_bnlmhr: Tensor<6>

Key/B tensor: QK-normed, RoPE-applied, bias-added, expanded to per-head, per-rank.

§Shape

[batch, nchunks, chunk_len, mimo_rank, nheads, state_rank]

§c_bnlmhr: Tensor<6>

Query/C tensor: same processing as B.

§Shape

[batch, nchunks, chunk_len, mimo_rank, nheads, state_rank]

§initial_state_bhpr: Tensor<4>

Initial SSM hidden state.

§Shape

[batch, nheads, per_head_dim, state_rank]

§init_state_hpr: Option<Tensor<3>>

Optional learnable initial state (broadcast over batch).

§Shape

[nheads, per_head_dim, state_rank]

Mamba3DoubleSsdInput

Struct Mamba3DoubleSsdInput Copy item path

Fields§

§Shape

§Shape

§Shape

§Shape

§Shape

§Shape

Implementations§

impl Mamba3DoubleSsdInput

pub fn double_ssd_minimal(self) -> (Tensor<6>, Tensor<4>)

§Shapes

impl Mamba3DoubleSsdInput

pub fn double_ssd_serial(self) -> (Tensor<6>, Tensor<4>)

§Returns

impl Mamba3DoubleSsdInput

pub fn double_ssd_serial_recalculated(self) -> (Tensor<6>, Tensor<4>)

§Returns

impl Mamba3DoubleSsdInput

pub fn sanity(&self)

impl Mamba3DoubleSsdInput

pub fn run(self, path: &Mamba3SsdPath) -> (Tensor<6>, Tensor<4>)

§Returns

Auto Trait Implementations§

impl Freeze for Mamba3DoubleSsdInput

impl RefUnwindSafe for Mamba3DoubleSsdInput

impl Send for Mamba3DoubleSsdInput

impl Sync for Mamba3DoubleSsdInput

impl Unpin for Mamba3DoubleSsdInput

impl UnsafeUnpin for Mamba3DoubleSsdInput

impl UnwindSafe for Mamba3DoubleSsdInput

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Struct Mamba3DoubleSsdInput

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,