Upload MixtralForCausalLM
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +34 -0
- generation_config.json +7 -0
- model-00001-of-00097.safetensors +3 -0
- model-00002-of-00097.safetensors +3 -0
- model-00003-of-00097.safetensors +3 -0
- model-00004-of-00097.safetensors +3 -0
- model-00005-of-00097.safetensors +3 -0
- model-00006-of-00097.safetensors +3 -0
- model-00007-of-00097.safetensors +3 -0
- model-00008-of-00097.safetensors +3 -0
- model-00009-of-00097.safetensors +3 -0
- model-00010-of-00097.safetensors +3 -0
- model-00011-of-00097.safetensors +3 -0
- model-00012-of-00097.safetensors +3 -0
- model-00013-of-00097.safetensors +3 -0
- model-00014-of-00097.safetensors +3 -0
- model-00015-of-00097.safetensors +3 -0
- model-00016-of-00097.safetensors +3 -0
- model-00017-of-00097.safetensors +3 -0
- model-00018-of-00097.safetensors +3 -0
- model-00019-of-00097.safetensors +3 -0
- model-00020-of-00097.safetensors +3 -0
- model-00021-of-00097.safetensors +3 -0
- model-00022-of-00097.safetensors +3 -0
- model-00023-of-00097.safetensors +3 -0
- model-00024-of-00097.safetensors +3 -0
- model-00025-of-00097.safetensors +3 -0
- model-00026-of-00097.safetensors +3 -0
- model-00027-of-00097.safetensors +3 -0
- model-00028-of-00097.safetensors +3 -0
- model-00029-of-00097.safetensors +3 -0
- model-00030-of-00097.safetensors +3 -0
- model-00031-of-00097.safetensors +3 -0
- model-00032-of-00097.safetensors +3 -0
- model-00033-of-00097.safetensors +3 -0
- model-00034-of-00097.safetensors +3 -0
- model-00035-of-00097.safetensors +3 -0
- model-00036-of-00097.safetensors +3 -0
- model-00037-of-00097.safetensors +3 -0
- model-00038-of-00097.safetensors +3 -0
- model-00039-of-00097.safetensors +3 -0
- model-00040-of-00097.safetensors +3 -0
- model-00041-of-00097.safetensors +3 -0
- model-00042-of-00097.safetensors +3 -0
- model-00043-of-00097.safetensors +3 -0
- model-00044-of-00097.safetensors +3 -0
- model-00045-of-00097.safetensors +3 -0
- model-00046-of-00097.safetensors +3 -0
- model-00047-of-00097.safetensors +3 -0
- model-00048-of-00097.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "./hydra",
|
3 |
+
"architectures": [
|
4 |
+
"MixtralForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 7168,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 20480,
|
14 |
+
"max_position_embeddings": 200000,
|
15 |
+
"model_type": "mixtral",
|
16 |
+
"num_attention_heads": 56,
|
17 |
+
"num_experts_per_tok": 2,
|
18 |
+
"num_hidden_layers": 60,
|
19 |
+
"num_key_value_heads": 8,
|
20 |
+
"num_local_experts": 4,
|
21 |
+
"output_router_logits": false,
|
22 |
+
"pad_token_id": 0,
|
23 |
+
"pretraining_tp": 1,
|
24 |
+
"rms_norm_eps": 1e-05,
|
25 |
+
"rope_scaling": null,
|
26 |
+
"rope_theta": 5000000.0,
|
27 |
+
"router_aux_loss_coef": 0.001,
|
28 |
+
"sliding_window": null,
|
29 |
+
"tie_word_embeddings": false,
|
30 |
+
"torch_dtype": "float32",
|
31 |
+
"transformers_version": "4.37.2",
|
32 |
+
"use_cache": true,
|
33 |
+
"vocab_size": 64000
|
34 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"pad_token_id": 0,
|
6 |
+
"transformers_version": "4.37.2"
|
7 |
+
}
|
model-00001-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d117e5879d396c48913485af01eba3d2985f4d2b0a735e5c33f2f9d023c97e48
|
3 |
+
size 4653696216
|
model-00002-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c187c0037c4473881c2d59e4fbec5f33f1b22d9aeb1dc0fb0df8442fd1c871da
|
3 |
+
size 4961920624
|
model-00003-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df80ae0218de635d3b4afebc2abae278f50e603c627b34aa50e65730f3b67d30
|
3 |
+
size 4903257368
|
model-00004-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7845e06b7c3bde58db05f4bdec03b1440111fd5ad952f37d6ee1f51fa386a13
|
3 |
+
size 4580353752
|
model-00005-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c9dde426697cf498efe2dbce4871e4a30ec834c586c95da0453ec1484f4701c
|
3 |
+
size 4697621552
|
model-00006-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4f1dee4d19153effcbd911292ede13d395b2b19f607574d77d65e95991d0fb8
|
3 |
+
size 4580353752
|
model-00007-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:353c3d533235be79cdb2573b6a6f955fc37ad5bb9d21523c830e59e84ddbd673
|
3 |
+
size 4580353752
|
model-00008-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c11b713e442ca8d2532071ce23b999f6784699af013a580475019b82cefdff33
|
3 |
+
size 4697621552
|
model-00009-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e29c64853bdb5556dbe4108e096ab93c416b9ecd5d694f357e274ddbab7b7aff
|
3 |
+
size 4580353752
|
model-00010-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a95dab034af983da2cc85ea8ba019b5f6bb15c10d3f2ea5a3496e44260425c2e
|
3 |
+
size 4961920624
|
model-00011-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d16f26f7cbe76195c1e9f9df87b5ef41b1d0febe73d6135025aa17112c5675e4
|
3 |
+
size 4903257368
|
model-00012-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d58be7dc9bd5d420e0e59cda74e277e9d78f7f038cf33787a5dd0b09fba32e1
|
3 |
+
size 4580353752
|
model-00013-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29968ffa2618c8bbfc742826192d2d0975afdb19dd2b00f55c612ebfcfefa8ca
|
3 |
+
size 4697621552
|
model-00014-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07e0f44eed713e413a83ea3b24f28cbf864f88a41f751ed4d4bce113140539e4
|
3 |
+
size 4580353752
|
model-00015-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50c1ef7e6e0760866e41132062b348be108e851e4620a00c5df356c7994bc4ad
|
3 |
+
size 4580353752
|
model-00016-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d4d5e48f2ec24d260c19c0c8ab1f0ee6eb125903509a4e4cee7863f0cd51e59
|
3 |
+
size 4697621552
|
model-00017-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78f4606e8052d85cc25eaa8ae5892faf457a124fe23e0af03f8140453ef5390e
|
3 |
+
size 4580353760
|
model-00018-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0370859f69e87e71b3a32df6904677817004e1c135b7ae4185303145dc7b723
|
3 |
+
size 4961920640
|
model-00019-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d29eec6483b2296297643ec82a4ab4e4958234c601d25827b0dc655920db918
|
3 |
+
size 4903257384
|
model-00020-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:982ea8472eca941978ede4b3beaa37ef656cff10b688937f82f464ef83a32e8c
|
3 |
+
size 4580353768
|
model-00021-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42a3dc599f71e93c0932f3fa07f633aa53984a8e00ccc93bc39781fb235fa73e
|
3 |
+
size 4697621560
|
model-00022-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44611a57738045b0002cc21c605f2dbb551ba0113b2e25d38c61f21310746249
|
3 |
+
size 4580353760
|
model-00023-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4708648589672bedb8ad090e58660465a53f253768449974773aa6e0cc0dec91
|
3 |
+
size 4580353768
|
model-00024-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6010cc86f4ccd7fa976ff5e22fb82cd683121fa82790b98a41d8733e080c8bcc
|
3 |
+
size 4697621560
|
model-00025-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d7950fb10f239905eac778c7ee8b0eb04d8607a7937e0a7d4da4365242e8167
|
3 |
+
size 4580353768
|
model-00026-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01bb0db0e48759eb12a41073ce6fb6f208f8970f8708000702532b0b7627b598
|
3 |
+
size 4961920640
|
model-00027-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df789d4d89bf412f8915c6c566a1dfac3611ba4b3891c420f679e4b165db400a
|
3 |
+
size 4903257384
|
model-00028-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb3ccf04055d41a5be0e6a023d1cfc7200113c195accbd84e63eba53417312db
|
3 |
+
size 4580353768
|
model-00029-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e1f12f9c6f1a700cce7688d00fc495cf32f314ac03c63f668dcdb232b9da7bb
|
3 |
+
size 4697621560
|
model-00030-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df4e0efe8ddeb1f48241e2b0ed04d2569f68106bfb6adadc5ca2b5d0160a68e9
|
3 |
+
size 4580353760
|
model-00031-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:914c8cf16cd88cc697e6593d6830e7a4875b9f96d1ceeef37b82dbc8564fee97
|
3 |
+
size 4580353768
|
model-00032-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67e2e9a15e94ce95d0358c314bc9de11bef393730d661c56dd7a1ca5eae4e682
|
3 |
+
size 4697621560
|
model-00033-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08df07f2b16e3b996a6f9eccd2783fd613b7139a1a8f0651d6af64480827329e
|
3 |
+
size 4580353768
|
model-00034-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41b3439d5a8b3f95dab12dec409616c5f48736c05345b81df5e8d9ea7b22fe1e
|
3 |
+
size 4961920640
|
model-00035-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13fee5f1e157232ed56d5f2320494fcdc434e076b703e5fd8eb4c5794ac1e3c8
|
3 |
+
size 4903257384
|
model-00036-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdd0ae375bd54a079a397a0319abc0936b24ef11d3463f8f31e93cb9ca6f1d4c
|
3 |
+
size 4580353768
|
model-00037-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8ea76ad3a2f40adfe9b7021afdf6879726545fa3b1806937ee6768915964fe7
|
3 |
+
size 4697621560
|
model-00038-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea650fd0198435cc5e2010caa9af3d9de15bd4060015eba0a399107b0df79edd
|
3 |
+
size 4580353760
|
model-00039-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae40622327bf47cd2d2e84a9f46bcf4944285a4f95c4823ab62eaa69a12bd81b
|
3 |
+
size 4580353768
|
model-00040-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b8dc381dbd9802b9c10ef3ea5381b6102ee46f10a03e6bbefbfebd27cc84ff6
|
3 |
+
size 4697621560
|
model-00041-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0351cd7bf9042091ada09c990e8c83b3e522e3b3dc31f5b22d3c7cb7d9b9d15
|
3 |
+
size 4580353768
|
model-00042-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1310b5e2ac89e4706f0f4713eaa25032b3986efe0187fc5093f415c44911b885
|
3 |
+
size 4961920640
|
model-00043-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:342075ad6da780d92d60b7cede87d46624376dd8d652865fa0df1ceed868c718
|
3 |
+
size 4903257384
|
model-00044-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f634c591af16768bd83a48e9e8cfb98dfb989d94e9810659217887a7019354b4
|
3 |
+
size 4580353768
|
model-00045-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cffc69eff23e642a0d32a6cb94f87d866a417b30b8839e8ce3c6c5e38707bb09
|
3 |
+
size 4697621560
|
model-00046-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00f03e395465aa780fee2bfb90058de4b6dfbf142994426e7dcf9ef1378a3c81
|
3 |
+
size 4580353760
|
model-00047-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7278047be5f349a8e57f2778b09afdd95c514f06c82489d49b3795e4392bf6a
|
3 |
+
size 4580353768
|
model-00048-of-00097.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57292da99f26d5d73bb99cb915010b0a70b568d49d9c14d00466cf77c131cfbb
|
3 |
+
size 4697621560
|