update config

config.json (+14 -13)

@@ -19,7 +19,16 @@
   "num_hidden_layers": 88,
   "num_key_value_heads": 8,
   "pretraining_tp": 1,
-  "quantization_config": {
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": null,
+  "rope_theta": 1000000.0,
+  "sliding_window": null,
+  "tie_word_embeddings": false,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.45.2",
+  "use_cache": true,
+  "vocab_size": 32768,
+  "quantization_config": {
     "model.layers.0.mlp.down_proj": {
       "bias": null,
       "enable_norm": true,
@@ -14803,15 +14812,7 @@
         -1,
         16
       ]
-    }
-  },
-  "rms_norm_eps": 1e-05,
-  "rope_scaling": null,
-  "rope_theta": 1000000.0,
-  "sliding_window": null,
-  "tie_word_embeddings": false,
-  "torch_dtype": "bfloat16",
-  "transformers_version": "4.45.2",
-  "use_cache": true,
-  "vocab_size": 32768
-}
+    },
+    "quant_method": "vptq"
+  }
+}
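The reordering is cosmetic as far as JSON goes, but the added "quant_method": "vptq" key is load-bearing: transformers' quantizer auto-dispatch looks this key up under quantization_config to select a backend. Below is a minimal sanity-check sketch for the updated file, not part of the commit; the local path and any structure beyond what the diff shows are assumptions.

import json

# Sketch only: "config.json" stands in for wherever the file lives locally.
with open("config.json") as f:
    cfg = json.load(f)

qcfg = cfg["quantization_config"]

# The key this commit adds; transformers' quantizer dispatch reads it.
assert qcfg.get("quant_method") == "vptq"

# Everything else under quantization_config is a per-layer spec such as
# "model.layers.0.mlp.down_proj".
layer_keys = [k for k in qcfg if k != "quant_method"]
assert all(k.startswith("model.") for k in layer_keys)

print(f"{len(layer_keys)} quantized modules, quant_method={qcfg['quant_method']!r}")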
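With the method tag in place, the checkpoint should load through the standard transformers entry point. A hedged loading sketch follows, assuming the vptq and accelerate packages are installed and the installed transformers release recognizes quant_method "vptq"; the repo id is a placeholder, not this model's actual repo.

from transformers import AutoModelForCausalLM, AutoTokenizer

repo_id = "VPTQ-community/your-model-here"  # placeholder repo id

tokenizer = AutoTokenizer.from_pretrained(repo_id)
model = AutoModelForCausalLM.from_pretrained(
    repo_id,
    torch_dtype="auto",   # picks up "torch_dtype": "bfloat16" from the config
    device_map="auto",    # requires accelerate; shards across available GPUs
)

inputs = tokenizer("Hello, world", return_tensors="pt").to(model.device)
out = model.generate(**inputs, max_new_tokens=16)
print(tokenizer.decode(out[0], skip_special_tokens=True))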