burn_mamba/mamba3/bidi/naive/mod.rs
1//! Naive implementation where the Mamba3 block is not adapted.
2//!
3//! Two independent layers are executed as a bidi pair,
4//! where the input flip-split happens before the layer normalization,
5//! and they are merged (by an [`OutputMerge`]) after the block output,
6//! before the layer-pair skip connection.
7
8mod layer;
9mod output_merge;
10
11pub use layer::{
12 Mamba3BidiLayerPair, Mamba3BidiLayerPairConfig, Mamba3BidiLayers, Mamba3BidiLayersConfig,
13};
14pub use output_merge::{OutputMerge, OutputMergeConfig};