ArthurZ
/

mamba-790m

Text Generation

text-generation-inference

Model card · Files and versions

ArthurZ HF Staff committed on Feb 29, 2024

Commit

b791109

·

verified ·

1 Parent(s): 852f0be

Upload MambaForCausalLM

Files changed (2) hide show

config.json +2 -2
model.safetensors +2 -2

config.json CHANGED Viewed

@@ -5,7 +5,7 @@
   ],
   "bos_token_id": 1,
   "conv_kernel": 4,
-  "d_model": 1536,
   "eos_token_id": 2,
   "expand": 2,
   "fused_add_norm": true,
@@ -16,7 +16,7 @@
   "layer_norm_epsilon": 1e-05,
   "model_type": "mamba",
   "n_layer": 48,
-  "num_hidden_layers": 32,
   "pad_vocab_size_multiple": 8,
   "residual_in_fp32": true,
   "rms_norm": true,

   ],
   "bos_token_id": 1,
   "conv_kernel": 4,
+  "d_model": 2048,
   "eos_token_id": 2,
   "expand": 2,
   "fused_add_norm": true,
   "layer_norm_epsilon": 1e-05,
   "model_type": "mamba",
   "n_layer": 48,
+  "num_hidden_layers": 48,
   "pad_vocab_size_multiple": 8,
   "residual_in_fp32": true,
   "rms_norm": true,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ed41bdb3582ac8312606e0413024d0265769003f9519505f4373e50a01d553a
-size 1112273944

 version https://git-lfs.github.com/spec/v1
+oid sha256:ebcfe054512122da4d54f83c3422a1c82cdd7788398ca0ddac6963c1aaa3071f
+size 1591179496