Skip to content

Commit

Permalink
Get Mamba2 working!
Browse files (browse the repository at this point in the history)
Signed-off-by: Tyler Michael Smith <[email protected]>
  • Loading branch information
tlrmchlsmth committed Jan 16, 2025
1 parent c956a30 commit 17923ad
Show file tree
Hide file tree
Showing 4 changed files with 940 additions and 2 deletions.
2 changes: 0 additions & 2 deletions vllm/model_executor/layers/mamba/mamba_mixer2.py
Original file line number Diff line number Diff line change
Expand Up @@ -174,7 +174,6 @@ def __init__(self,
intermediate_size: int,
use_conv_bias: bool,
use_bias: bool,
- use_rms_norm: bool,
n_groups: int = 1,
num_heads: int = 128,
head_dim: int = 64,
Expand Down Expand Up @@ -203,7 +202,6 @@ def __init__(self,
"Tensor parallel world size must divide num heads."

self.ssm_state_size = ssm_state_size
- self.use_rms_norm = use_rms_norm
self.activation = activation

self.chunk_size = chunk_size
Expand Down
Loading

0 comments on commit 17923ad

Please sign in to comment.