Upload folder using huggingface_hub
- README.md +1 -1
- config.json +1 -1
README.md CHANGED
@@ -30,7 +30,7 @@ config.intermediate_size = 16
 config.num_attention_heads = 4
 config.num_hidden_layers = 16
 config.num_key_value_heads = 2
-config.use_mamba_kernels = False
+# config.use_mamba_kernels = False

 model = AutoModelForCausalLM.from_config(
     config, torch_dtype=torch.bfloat16, attn_implementation="sdpa", trust_remote_code=True
config.json CHANGED
@@ -40,6 +40,6 @@
 "torch_dtype": "bfloat16",
 "transformers_version": "4.44.0",
 "use_cache": true,
-"use_mamba_kernels": false,
+"use_mamba_kernels": true,
 "vocab_size": 65536
 }
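Net effect of the commit: config.json now enables the fused Mamba kernels, and the README snippet no longer forces them off. A minimal sketch of how the flag behaves at load time, assuming this is a Jamba-style hybrid model in Transformers; the repo id org/tiny-random-hybrid is a placeholder for this checkpoint:

import torch
from transformers import AutoModelForCausalLM

repo_id = "org/tiny-random-hybrid"  # placeholder, not the real repo id

# With "use_mamba_kernels": true in config.json, the Mamba mixer dispatches
# to the fused mamba-ssm / causal-conv1d CUDA kernels when those packages
# are installed and the model is on GPU.
model = AutoModelForCausalLM.from_pretrained(
    repo_id,
    torch_dtype=torch.bfloat16,
    attn_implementation="sdpa",
    trust_remote_code=True,
)

# On CPU, or without the kernel packages installed, override the flag to
# fall back to the pure-PyTorch path; config kwargs passed to
# from_pretrained override the values stored in config.json.
model_cpu = AutoModelForCausalLM.from_pretrained(
    repo_id,
    use_mamba_kernels=False,
    trust_remote_code=True,
)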