rwkvzip/rwkv7/mod.rs
1//! High-performance RWKV7 inference kernel for x86_64.
2//!
3//! This module provides a highly optimized RWKV7 implementation specifically
4//! designed for x86_64 CPUs with AVX2/FMA support. No portability fallbacks.
5//!
6//! # Architecture
7//!
8//! - All matrix operations are SIMD-vectorized (AVX2 + FMA)
9//! - State updates use a hand-tuned kernel for the N=64 head dimension
10//! - Memory layout optimized for cache efficiency
11//! - No external BLAS dependencies
12
13mod kernel;
14mod model;
15mod profiling;
16mod tensor;
17mod weights;
18
19#[cfg(feature = "training")]
20pub mod training;
21
22pub use model::ScratchBuffers;
23pub use model::{Config, Model, State};
24pub use profiling::{LayerProfiler, LayerTiming, NullProfiler, ProfilerSink};
25pub use tensor::{Tensor1D, Tensor2D, TensorView1D, TensorView2D};
26pub use weights::Weights;