Upload MixtralForCausalLM
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +34 -0
- generation_config.json +8 -0
- model-00001-of-00201.safetensors +3 -0
- model-00002-of-00201.safetensors +3 -0
- model-00003-of-00201.safetensors +3 -0
- model-00004-of-00201.safetensors +3 -0
- model-00005-of-00201.safetensors +3 -0
- model-00006-of-00201.safetensors +3 -0
- model-00007-of-00201.safetensors +3 -0
- model-00008-of-00201.safetensors +3 -0
- model-00009-of-00201.safetensors +3 -0
- model-00010-of-00201.safetensors +3 -0
- model-00011-of-00201.safetensors +3 -0
- model-00012-of-00201.safetensors +3 -0
- model-00013-of-00201.safetensors +3 -0
- model-00014-of-00201.safetensors +3 -0
- model-00015-of-00201.safetensors +3 -0
- model-00016-of-00201.safetensors +3 -0
- model-00017-of-00201.safetensors +3 -0
- model-00018-of-00201.safetensors +3 -0
- model-00019-of-00201.safetensors +3 -0
- model-00020-of-00201.safetensors +3 -0
- model-00021-of-00201.safetensors +3 -0
- model-00022-of-00201.safetensors +3 -0
- model-00023-of-00201.safetensors +3 -0
- model-00024-of-00201.safetensors +3 -0
- model-00025-of-00201.safetensors +3 -0
- model-00026-of-00201.safetensors +3 -0
- model-00027-of-00201.safetensors +3 -0
- model-00028-of-00201.safetensors +3 -0
- model-00029-of-00201.safetensors +3 -0
- model-00030-of-00201.safetensors +3 -0
- model-00031-of-00201.safetensors +3 -0
- model-00032-of-00201.safetensors +3 -0
- model-00033-of-00201.safetensors +3 -0
- model-00034-of-00201.safetensors +3 -0
- model-00035-of-00201.safetensors +3 -0
- model-00036-of-00201.safetensors +3 -0
- model-00037-of-00201.safetensors +3 -0
- model-00038-of-00201.safetensors +3 -0
- model-00039-of-00201.safetensors +3 -0
- model-00040-of-00201.safetensors +3 -0
- model-00041-of-00201.safetensors +3 -0
- model-00042-of-00201.safetensors +3 -0
- model-00043-of-00201.safetensors +3 -0
- model-00044-of-00201.safetensors +3 -0
- model-00045-of-00201.safetensors +3 -0
- model-00046-of-00201.safetensors +3 -0
- model-00047-of-00201.safetensors +3 -0
- model-00048-of-00201.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "./gianthydra",
|
3 |
+
"architectures": [
|
4 |
+
"MixtralForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 28672,
|
14 |
+
"max_position_embeddings": 4096,
|
15 |
+
"model_type": "mixtral",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_experts_per_tok": 2,
|
18 |
+
"num_hidden_layers": 80,
|
19 |
+
"num_key_value_heads": 8,
|
20 |
+
"num_local_experts": 4,
|
21 |
+
"output_router_logits": false,
|
22 |
+
"pad_token_id": 0,
|
23 |
+
"pretraining_tp": 1,
|
24 |
+
"rms_norm_eps": 1e-05,
|
25 |
+
"rope_scaling": null,
|
26 |
+
"rope_theta": 10000.0,
|
27 |
+
"router_aux_loss_coef": 0.001,
|
28 |
+
"sliding_window": null,
|
29 |
+
"tie_word_embeddings": false,
|
30 |
+
"torch_dtype": "float32",
|
31 |
+
"transformers_version": "4.37.2",
|
32 |
+
"use_cache": false,
|
33 |
+
"vocab_size": 32000
|
34 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"pad_token_id": 0,
|
6 |
+
"transformers_version": "4.37.2",
|
7 |
+
"use_cache": false
|
8 |
+
}
|
model-00001-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:510176a48d72902ac5ecb133257286150049b0dd61f56c4ab1b0dc792c2eddb9
|
3 |
+
size 4471260248
|
model-00002-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca1d723e8af07415a60a5ed59fe26841558d463c7fa18bb1397d66715e3afec6
|
3 |
+
size 4697621160
|
model-00003-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70b9ff8d8387de3432a3f691924e78a4f71812c6acb6e52f39820b30e08c8a23
|
3 |
+
size 4362274128
|
model-00004-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90d54ac75e956eac7cbc7d2c5c1d491b4ca0fc7de3bd73b4bff4e313667ee35b
|
3 |
+
size 4697621160
|
model-00005-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdac281289add341da239eee538d139d334af921d29a12885462be7391b7a6e3
|
3 |
+
size 4697621160
|
model-00006-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ee21f0110b662a3e699bcc01f61f103e38d22d08e7f2f0aa468b80540aa3013
|
3 |
+
size 4362274128
|
model-00007-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6daf30af231e1d2184c53726f6f99aafa7da6811e5ec2d8e1b279d4aa950910
|
3 |
+
size 4697621160
|
model-00008-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ff61de5aba6feee62fa32c33125f3ea147ad6d2f486093ec2f27266c20b500f
|
3 |
+
size 4999677048
|
model-00009-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6344d7c963091c486b7ed07e100b838484b5bce79dcd73efc5e79de3a8ec1cb2
|
3 |
+
size 4999742472
|
model-00010-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:174da2e4365d1ed5e09e4e0129f599ac6f6ce7d0772e638ca9fefb0b3628e8e9
|
3 |
+
size 4697621160
|
model-00011-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c7e41230bbc6f75a2da7e7a26ffcc4d411132a1955b30511f9a44a3b1f70c4e
|
3 |
+
size 4362274128
|
model-00012-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52813b32615f5e77bc170fe69e0a5c96feb2ea994ad0f4d69a7a27e5877b4255
|
3 |
+
size 4697621160
|
model-00013-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3411dfbe187eb9f27d9ede2faa51d9bf6501cae55b5c45fcdd53018c94400d2
|
3 |
+
size 4999677048
|
model-00014-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3607b0a308a6d0a6e7f1cc82c88195ba9650760d547fed64a294084bbe8c0903
|
3 |
+
size 4999742472
|
model-00015-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8b4cbc134e17e8d4761b2b93ee827f0dbaac072c4006b5e133835a1af3820b8
|
3 |
+
size 4697621160
|
model-00016-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:387438f39f6d93f67d76806e0e1ee08fadf34cced4c58d8517827de99f8ac910
|
3 |
+
size 4362274128
|
model-00017-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acc7d1efccfb33e7dee4312bd4b267c1c58ca4202c24402048b5f7597b4823f7
|
3 |
+
size 4697621160
|
model-00018-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:faabc9f5889c35689f15380c5570051b1ff97ad555a9aa5e4b1acfdba378b3ee
|
3 |
+
size 4999677048
|
model-00019-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c491dd97738beb840e2be54b18b4e4ac361e75bfa4ee2a93e36931db73b9d76
|
3 |
+
size 4999742472
|
model-00020-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3cf13479f07de09e166369906dedc73e8a4c4aa1b8dd8bf9c912bda7f97dad7
|
3 |
+
size 4697621160
|
model-00021-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb3b2b9164e1fe8dfd1798b85284192041ee7bc4819e39472e7c1441c32d2c7b
|
3 |
+
size 4362274128
|
model-00022-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c0e26dd8f9e9e4d09ad0bd3111910d4c3a10efeb1d10ea9a39f82099c61b134
|
3 |
+
size 4697621160
|
model-00023-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebf6a944439c121af7a10f9f7f38ab48e314b90743ff2ab1d47dd865d06a60fe
|
3 |
+
size 4999677048
|
model-00024-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:622a7b55ea6b40dc825a3261834080bb0b48b5f748594528adca93c4bd258027
|
3 |
+
size 4999742472
|
model-00025-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:280f460e27719b2d4bbc86f23ced27c4b7e1ecc01a9ec902c8c1a6d8483572b8
|
3 |
+
size 4697621160
|
model-00026-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b91b968ce35564a5a793d153cc41acc3ebe34cc1c2978bd16447018b1a8cb00
|
3 |
+
size 4362274136
|
model-00027-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:470c380514cc20e7cd763b9bc42e1b0858242c4fadba6581f9d4838903c6bd27
|
3 |
+
size 4697621168
|
model-00028-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:482edf2b7e445f9829c0ab2d6f9ce30f4fc92ee524a66e8843cf1230db5f8b3c
|
3 |
+
size 4999677056
|
model-00029-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1ac89f7c7b7ceb8c9ae29771395607a501f845dfadfdeaefeb08521606f9520
|
3 |
+
size 4999742480
|
model-00030-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7335ac561a2732ca8e1a933256b591723adc81213eca6582e7585697b46736c6
|
3 |
+
size 4697621168
|
model-00031-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:849cf8779c007f802b1c00491bc9443055a718d5fb079c72d8ce47d1633b4858
|
3 |
+
size 4362274144
|
model-00032-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e67ded99b4290ae672e255160725659f9d895fbccac23584246bbfbbceadbd54
|
3 |
+
size 4697621168
|
model-00033-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a488f2af2430764200760f2cf7b015dc1f9b1c8f257182de28f24f8b476a6e02
|
3 |
+
size 4999677056
|
model-00034-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a261940d3cdfc7ec7874722eb8a92a3088bbdb217bd916af80e05351ec16fa4
|
3 |
+
size 4999742480
|
model-00035-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12681f117d6fda8f0147bee0ea4ca39a7e7195d8ab3f2c899e819f11e0192917
|
3 |
+
size 4697621168
|
model-00036-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca6d8bf5f153aa79addaedb6a5676f588e9b96f00413ed871dbbe77ee17fc3b7
|
3 |
+
size 4362274144
|
model-00037-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61305834df92f9db558276beccc0ffea8368f60fe5f5e866f7bd3fda726bc55c
|
3 |
+
size 4697621168
|
model-00038-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3a1975d6701a159ea79fb46dcb6879e227b3f0f9e470882544f37065a25268f
|
3 |
+
size 4999677056
|
model-00039-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96ea3217d2d650785c19e9ee7c15bcc79b4d26306c06ee84e03e2da301579d8a
|
3 |
+
size 4999742480
|
model-00040-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73a581abee18103482961cd171f97118ee7de6a0808783d5cfb498118f44fb74
|
3 |
+
size 4697621168
|
model-00041-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8296e2f117ed7ed953c18c5c1605d50505a3e8e11c6545cf76e108f67b11ebea
|
3 |
+
size 4362274144
|
model-00042-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:589a45e0722415cb79fe6cadc9b1d0ecc30f998c2ee0928dc7ba385b69e135d7
|
3 |
+
size 4697621168
|
model-00043-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08e1765cfb4c65d6e898e3d567f0dfb985167117ab5dafd1f773b3250ed5f409
|
3 |
+
size 4999677056
|
model-00044-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c739a03f221cb5653856d1c4842b6fc225e28f52f5573d85fc032b5a1687a77f
|
3 |
+
size 4999742480
|
model-00045-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:760ef5a75be203f04d5a823afb56095a92e906678acb2343316cffea94b1d6d6
|
3 |
+
size 4697621168
|
model-00046-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:776d0670887a11c19c3818d5edaadd51a95c516a97626f386ce11d4756cf84d1
|
3 |
+
size 4362274144
|
model-00047-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:739a9e9f62b3d10f47344534d44659914d1ef052c8fd1c431bbd1aa603350b79
|
3 |
+
size 4697621168
|
model-00048-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16d24b31e322d96479f3337daa952ed65ca487b7cd69043f00796c0bf1048db2
|
3 |
+
size 4999677056
|