pub struct Model { /* private fields */ }
Mamba model weights and inference kernels.
Implementations§
Source§impl Model
impl Model
Sourcepub fn new_full_adam_state(&self) -> FullAdamState
pub fn new_full_adam_state(&self) -> FullAdamState
Allocate zero-initialized Adam moments matching all trainable tensors.
Sourcepub fn new_random(cfg: Config, seed: u64) -> Result<Self>
pub fn new_random(cfg: Config, seed: u64) -> Result<Self>
Build a deterministic random model for online-mode workflows.
Sourcepub fn save_safetensors<P: AsRef<Path>>(&self, path: P) -> Result<()>
pub fn save_safetensors<P: AsRef<Path>>(&self, path: P) -> Result<()>
Save checkpoint to safetensors (native infotheory Mamba layout).
Sourcepub fn save_full_adam_safetensors<P: AsRef<Path>>(
&self,
adam: &FullAdamState,
path: P,
) -> Result<()>
pub fn save_full_adam_safetensors<P: AsRef<Path>>( &self, adam: &FullAdamState, path: P, ) -> Result<()>
Save full-parameter Adam moments for exact online-training continuation.
Sourcepub fn load_full_adam_safetensors<P: AsRef<Path>>(
&self,
path: P,
) -> Result<FullAdamState>
pub fn load_full_adam_safetensors<P: AsRef<Path>>( &self, path: P, ) -> Result<FullAdamState>
Load full-parameter Adam moments and validate tensor shapes.
Sourcepub fn lm_head_weights(&self) -> &[f32]
pub fn lm_head_weights(&self) -> &[f32]
Immutable LM-head weights, row-major (vocab, hidden).
Sourcepub fn lm_head_weights_mut(&mut self) -> &mut [f32]
pub fn lm_head_weights_mut(&mut self) -> &mut [f32]
Mutable LM-head weights, row-major (vocab, hidden).
Sourcepub fn online_train_segment_tbptt(
&mut self,
scratch: &mut ScratchBuffers,
start_state: &State,
steps: &[(u32, u8, Vec<f64>)],
scope: TrainScopeMask,
optimizer: OptimizerKind,
lr: f32,
clip: f32,
replay_chunk: usize,
adam_t: &mut usize,
model_adam: Option<&mut FullAdamState>,
out_bias: Option<&mut [f32]>,
out_bias_adam_m: Option<&mut [f32]>,
out_bias_adam_v: Option<&mut [f32]>,
live_state_out: &mut State,
) -> Result<()>
pub fn online_train_segment_tbptt( &mut self, scratch: &mut ScratchBuffers, start_state: &State, steps: &[(u32, u8, Vec<f64>)], scope: TrainScopeMask, optimizer: OptimizerKind, lr: f32, clip: f32, replay_chunk: usize, adam_t: &mut usize, model_adam: Option<&mut FullAdamState>, out_bias: Option<&mut [f32]>, out_bias_adam_m: Option<&mut [f32]>, out_bias_adam_v: Option<&mut [f32]>, live_state_out: &mut State, ) -> Result<()>
Run one TBPTT training segment and write the resulting live state.
Sourcepub fn forward<'a>(
&'a self,
scratch: &'a mut ScratchBuffers,
token: u32,
state: &mut State,
) -> &'a [f32]
pub fn forward<'a>( &'a self, scratch: &'a mut ScratchBuffers, token: u32, state: &mut State, ) -> &'a [f32]
Forward a single byte token and return the logits for the next symbol.
Sourcepub fn online_train_step_bptt1(
&mut self,
scratch: &mut ScratchBuffers,
state: &State,
symbol: u8,
pdf: &[f64],
scope: TrainScopeMask,
optimizer: OptimizerKind,
lr: f32,
clip: f32,
adam_t: &mut usize,
model_adam: Option<&mut FullAdamState>,
out_bias: Option<&mut [f32]>,
out_bias_adam_m: Option<&mut [f32]>,
out_bias_adam_v: Option<&mut [f32]>,
) -> Result<()>
pub fn online_train_step_bptt1( &mut self, scratch: &mut ScratchBuffers, state: &State, symbol: u8, pdf: &[f64], scope: TrainScopeMask, optimizer: OptimizerKind, lr: f32, clip: f32, adam_t: &mut usize, model_adam: Option<&mut FullAdamState>, out_bias: Option<&mut [f32]>, out_bias_adam_m: Option<&mut [f32]>, out_bias_adam_v: Option<&mut [f32]>, ) -> Result<()>
Exact single-step (bptt=1) online training for all Mamba parameters.
This consumes the latest forward trace captured in scratch and applies
one gradient step using the externally provided PDF/target symbol.
Trait Implementations§
Auto Trait Implementations§
impl Freeze for Model
impl RefUnwindSafe for Model
impl Send for Model
impl Sync for Model
impl Unpin for Model
impl UnwindSafe for Model
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Source§impl<T> CloneToUninit for T where
T: Clone,
impl<T> CloneToUninit for T where
T: Clone,
§impl<T> Conv for T
impl<T> Conv for T
§impl<T> FmtForward for T
impl<T> FmtForward for T
§fn fmt_binary(self) -> FmtBinary<Self>where
Self: Binary,
fn fmt_binary(self) -> FmtBinary<Self>where
Self: Binary,
Causes self to use its Binary implementation when Debug-formatted.
§fn fmt_display(self) -> FmtDisplay<Self> where
Self: Display,
fn fmt_display(self) -> FmtDisplay<Self>where
Self: Display,
Causes self to use its Display implementation when
Debug-formatted.
§fn fmt_lower_exp(self) -> FmtLowerExp<Self> where
Self: LowerExp,
fn fmt_lower_exp(self) -> FmtLowerExp<Self>where
Self: LowerExp,
Causes self to use its LowerExp implementation when
Debug-formatted.
§fn fmt_lower_hex(self) -> FmtLowerHex<Self> where
Self: LowerHex,
fn fmt_lower_hex(self) -> FmtLowerHex<Self>where
Self: LowerHex,
Causes self to use its LowerHex implementation when
Debug-formatted.
§fn fmt_octal(self) -> FmtOctal<Self> where
Self: Octal,
fn fmt_octal(self) -> FmtOctal<Self>where
Self: Octal,
Causes self to use its Octal implementation when Debug-formatted.
§fn fmt_pointer(self) -> FmtPointer<Self> where
Self: Pointer,
fn fmt_pointer(self) -> FmtPointer<Self>where
Self: Pointer,
Causes self to use its Pointer implementation when
Debug-formatted.
§fn fmt_upper_exp(self) -> FmtUpperExp<Self> where
Self: UpperExp,
fn fmt_upper_exp(self) -> FmtUpperExp<Self>where
Self: UpperExp,
Causes self to use its UpperExp implementation when
Debug-formatted.
§fn fmt_upper_hex(self) -> FmtUpperHex<Self> where
Self: UpperHex,
fn fmt_upper_hex(self) -> FmtUpperHex<Self>where
Self: UpperHex,
Causes self to use its UpperHex implementation when
Debug-formatted.
§fn fmt_list(self) -> FmtList<Self> where
&'a Self: for<'a> IntoIterator,
fn fmt_list(self) -> FmtList<Self>where
&'a Self: for<'a> IntoIterator,
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self>
if into_left is true.
Converts self into a Right variant of Either<Self, Self>
otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self>
if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self>
otherwise. Read more
§impl<T> Pipe for T where
T: ?Sized,
impl<T> Pipe for T where
T: ?Sized,
§fn pipe<R>(self, func: impl FnOnce(Self) -> R) -> Rwhere
Self: Sized,
fn pipe<R>(self, func: impl FnOnce(Self) -> R) -> Rwhere
Self: Sized,
§fn pipe_ref<'a, R>(&'a self, func: impl FnOnce(&'a Self) -> R) -> Rwhere
R: 'a,
fn pipe_ref<'a, R>(&'a self, func: impl FnOnce(&'a Self) -> R) -> Rwhere
R: 'a,
Borrows self and passes that borrow into the pipe function. Read more
§fn pipe_ref_mut<'a, R>(&'a mut self, func: impl FnOnce(&'a mut Self) -> R) -> R where
R: 'a,
fn pipe_ref_mut<'a, R>(&'a mut self, func: impl FnOnce(&'a mut Self) -> R) -> Rwhere
R: 'a,
Mutably borrows self and passes that borrow into the pipe function. Read more
§fn pipe_borrow<'a, B, R>(&'a self, func: impl FnOnce(&'a B) -> R) -> R
fn pipe_borrow<'a, B, R>(&'a self, func: impl FnOnce(&'a B) -> R) -> R
§fn pipe_borrow_mut<'a, B, R>(
&'a mut self,
func: impl FnOnce(&'a mut B) -> R,
) -> R
fn pipe_borrow_mut<'a, B, R>( &'a mut self, func: impl FnOnce(&'a mut B) -> R, ) -> R
§fn pipe_as_ref<'a, U, R>(&'a self, func: impl FnOnce(&'a U) -> R) -> R
fn pipe_as_ref<'a, U, R>(&'a self, func: impl FnOnce(&'a U) -> R) -> R
Borrows self, then passes self.as_ref() into the pipe function.
§fn pipe_as_mut<'a, U, R>(&'a mut self, func: impl FnOnce(&'a mut U) -> R) -> R
fn pipe_as_mut<'a, U, R>(&'a mut self, func: impl FnOnce(&'a mut U) -> R) -> R
Mutably borrows self, then passes self.as_mut() into the pipe
function.
§fn pipe_deref<'a, T, R>(&'a self, func: impl FnOnce(&'a T) -> R) -> R
fn pipe_deref<'a, T, R>(&'a self, func: impl FnOnce(&'a T) -> R) -> R
Borrows self, then passes self.deref() into the pipe function.
§impl<T> Pointable for T
impl<T> Pointable for T
§impl<T> Tap for T
impl<T> Tap for T
§fn tap_borrow<B>(self, func: impl FnOnce(&B)) -> Self
fn tap_borrow<B>(self, func: impl FnOnce(&B)) -> Self
Immutable access to the Borrow<B> of a value. Read more
§fn tap_borrow_mut<B>(self, func: impl FnOnce(&mut B)) -> Self
fn tap_borrow_mut<B>(self, func: impl FnOnce(&mut B)) -> Self
Mutable access to the BorrowMut<B> of a value. Read more
§fn tap_ref<R>(self, func: impl FnOnce(&R)) -> Self
fn tap_ref<R>(self, func: impl FnOnce(&R)) -> Self
Immutable access to the AsRef<R> view of a value. Read more
§fn tap_ref_mut<R>(self, func: impl FnOnce(&mut R)) -> Self
fn tap_ref_mut<R>(self, func: impl FnOnce(&mut R)) -> Self
Mutable access to the AsMut<R> view of a value. Read more
§fn tap_deref<T>(self, func: impl FnOnce(&T)) -> Self
fn tap_deref<T>(self, func: impl FnOnce(&T)) -> Self
Immutable access to the Deref::Target of a value. Read more
§fn tap_deref_mut<T>(self, func: impl FnOnce(&mut T)) -> Self
fn tap_deref_mut<T>(self, func: impl FnOnce(&mut T)) -> Self
Mutable access to the Deref::Target of a value. Read more
§fn tap_dbg(self, func: impl FnOnce(&Self)) -> Self
fn tap_dbg(self, func: impl FnOnce(&Self)) -> Self
Calls .tap() only in debug builds, and is erased in release builds.
§fn tap_mut_dbg(self, func: impl FnOnce(&mut Self)) -> Self
fn tap_mut_dbg(self, func: impl FnOnce(&mut Self)) -> Self
Calls .tap_mut() only in debug builds, and is erased in release
builds.
§fn tap_borrow_dbg<B>(self, func: impl FnOnce(&B)) -> Self
fn tap_borrow_dbg<B>(self, func: impl FnOnce(&B)) -> Self
Calls .tap_borrow() only in debug builds, and is erased in release
builds.
§fn tap_borrow_mut_dbg<B>(self, func: impl FnOnce(&mut B)) -> Self
fn tap_borrow_mut_dbg<B>(self, func: impl FnOnce(&mut B)) -> Self
Calls .tap_borrow_mut() only in debug builds, and is erased in release
builds.
§fn tap_ref_dbg<R>(self, func: impl FnOnce(&R)) -> Self
fn tap_ref_dbg<R>(self, func: impl FnOnce(&R)) -> Self
Calls .tap_ref() only in debug builds, and is erased in release
builds.
§fn tap_ref_mut_dbg<R>(self, func: impl FnOnce(&mut R)) -> Self
fn tap_ref_mut_dbg<R>(self, func: impl FnOnce(&mut R)) -> Self
Calls .tap_ref_mut() only in debug builds, and is erased in release
builds.
§fn tap_deref_dbg<T>(self, func: impl FnOnce(&T)) -> Self
fn tap_deref_dbg<T>(self, func: impl FnOnce(&T)) -> Self
Calls .tap_deref() only in debug builds, and is erased in release
builds.