Re-add architectures, MTP
Browse files
- config.json +7 -1
config.json
CHANGED
|
@@ -1,4 +1,7 @@
|
|
| 1 |
{
|
|
|
|
|
|
|
|
|
|
| 2 |
"attention_dropout": 0.0,
|
| 3 |
"bos_token_id": 200034,
|
| 4 |
"eos_token_id": 200020,
|
|
@@ -40,5 +43,8 @@
|
|
| 40 |
"tie_word_embeddings": false,
|
| 41 |
"transformers_version": "5.0.0.dev0",
|
| 42 |
"use_cache": true,
|
| 43 |
-
"vocab_size": 200064
|
|
|
|
|
|
|
|
|
|
| 44 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"MiniMaxM2ForCausalLM"
|
| 4 |
+
],
|
| 5 |
"attention_dropout": 0.0,
|
| 6 |
"bos_token_id": 200034,
|
| 7 |
"eos_token_id": 200020,
|
|
|
|
| 43 |
"tie_word_embeddings": false,
|
| 44 |
"transformers_version": "5.0.0.dev0",
|
| 45 |
"use_cache": true,
|
| 46 |
+
"vocab_size": 200064,
|
| 47 |
+
"mtp_transformer_layers": 1,
|
| 48 |
+
"num_mtp_modules": 3,
|
| 49 |
+
"use_mtp": true
|
| 50 |
}
|