Upload folder using huggingface_hub (#2)
Browse files- 8e2190dcd8ca77f4ec090bd042aaa3b9b28e7796f03531aba822d65d59440768 (dfc5f05d301e83c7bbccc034c34e2f879755822a)
- 13ce69aa8ff27b301054dc63cd75b90fda003fbfffaacddc83acb215c35da96a (686499b990fb417ff0996c2852566a1552eb33d6)
- 10357b0f603e5be2bd7054b25e31c9d52f52e135bbf340fbb02e61aa748abc39 (b305f5f17251160f5a03d582ca40b26c06ee85e6)
- 8019eab46b499fa66999ba0139ed53be05872a284bb5db33d1fad28f8e06f05b (bbe9acd713983e16bbee96e9c3829c2ad5ef66f8)
- c24fa0ffac45a5e59f322e40a797caa54c62e38b95e2d9abe69ecf0c0738dd23 (35561fda28d97ef7ffedcc99fc5790626937b9b5)
- 1691e233b5cf9768d0124f3a1f2b00881e59c0a212708f4a5a7db8d7932bba16 (c745d526476c6a865abf0324e3991f879939f638)
- 350244a54f2a7cc3f5a6f753fbed219dba08ff6bcf11bd9b7ea905fd295c8cd7 (7f78449b7e8161404e736852933602dae7f25d70)
- 127f9ada11c5f6302756858661324c42b018885570c6fb1306c49a378df133a9 (96d5c7be245c6ada6bc05852c4a8adf2158cc12f)
- a42e2c0b97d017b2376c504eabd5dd0812ccebbb33aecd45b718edfa9e2d5e09 (2bf86f620389d2cc3c9f4afbef0a67b94730119a)
- b9705dfcf9230e248a5d270cd852d101d15f9c12d035d2dce841a68c582a1ecf (b2f315dd59d212c9b64af639c20780a3b5a47fd3)
- 53857526e30b6ca40400d5859bc2c5bdfc6bc76bebffb0030eda168210195633 (bcfdf49a83af13e48156f601bf3e09752f083c52)
- cc3e37235a3d0bbfbdbe30c89e2000551bb6df66755ba3d5a58e803be4c12f8f (aee456d60c2e297e97b690399d82ac6520da9d41)
- 77beb9534ac061baf7c9529b90a44d34511404cad404a35cd5ad1e9d4248facc (75345a9189a04c8aac4d278e005dc5c41e48325f)
- 82483d9661d58d4d1852e79ccc52b4ec47a77b64ee2c7debb0ae1bf163aa003f (0f70fafa18920204c1c30416d9e0730c45292b57)
- 39ec7dbee6304b376613e44d7c103f6cd107ddb83ea207b51708af9200b36eb0 (7173458e0b9e3029b00a39623101002f3934ee99)
- 5b4c6d009aeac4cb5821c080ad2d0c17d2a412e4474cf167832951c9fa70208e (7ed864b61e0b0fd024badc3aaa51ec98ca2f5c47)
- 93726c91f7804da607f1a57f24e4a6c5d7225cee6c5bc1c61892451637541de9 (4341ebe2427e8d1c6aae6a6668abb0d4275d171f)
- 275c401e04d35144d291c0ac660ccba3b820193c066ce86394e49a84f054d9b2 (653b74c43aec9186b2a10879ac56bd1084c33165)
- e2d7fd59fc8f84a52a77a93c975b7135d1b69a3145874880abd0cdd85f1f8041 (6103180376025eb078d323736495743e713e70c0)
- 52a7d7936a8aaf9c72558fbbcc44e6508166176b3828e1fbb266e91d4e4772e5 (6467b123bc3c3a4b2201afae467b99ac6ed4b62a)
- 0bb9d8f81c430bfa3663c31ebaf875d0c5abde9a07e8597ddf526fbf3cb4457d (1b430c28d6eb43392203d3d14673015b9d6e5c5a)
- b1d216d3af51b5acd6906a197b4492169682a37d18f79dcce2752f2386eea92d (93b5c95aa43cd6108b156ef193ed2b70f4ae76a0)
- 61e36debba634af1130dd4cdda2adf6d5dae189ba2897f2ad4a4ac5f82d31d02 (01f49b96b1b908216b3a39c5fc90e9cda3a6ef4a)
- 2a26697cf22812930c46865659cb1f7e6ccb59274bd339a21af9b50fd6eddca5 (31be7ecc46c3bc7d1836f04a0dfb8e90d78a49e7)
- 234f48105908d805877a5f4515e0c4040b0a0a5668b904dce77629fbaf410dab (93f3931c81c22fe7baf4bae59ca55883c7a118f5)
- 3ad5a08ff36044b70ce9fa962d78c465c2df540eb2ea90e951480f77a1de0c23 (59bf3d8727d2e8e232dec3806c87bc2a712ae9ba)
- 7f0655a17ad0af7d161872887ae2820288adad285cfc692dda44a83f75dd62c4 (23b5632f7f62c7bff6e9883baca7530c49e29ebc)
- 98950f0bfc1291c5a02625607cdae5f89c17c53e9ab9a26c94f03adafbffe716 (e935af5dfb5975fcfaac9fc11714d340d4623237)
- 0e753ca875559ed03d609960aedc452dec500b6bcadefc5fd7025f79bc90b16c (fa4bf428f5856650e0a79b86e0863b47d77cc9ca)
- b93d8a7b0601238a09e597123a9d6e94f6c50d0aa30f0340ec8b45d1a5a364ad (0987ef1a40e09ca797c81b3d7ce4a77fcbdbbd1b)
- bdbc3d0298e45f2cd4f778fb4c99d339a4c3b8a0035f54411e7f527d26d6678d (e146f5d60220119aeb5a31b79e58ce4ce0da199e)
- c47d220cefdfe2981241cc4b6aad7b8e40fabc2d33d2992688148b25cf3dde5e (6e25b52ad402a5dd3f4523b7b99901f0237428e9)
- c6b6de80a11cf4403f54326d3971e046628487fc0e336b52bc44799a19522abd (4bbad7a3a7cc3662e14354daba328d86f7e24514)
- ccce89e942af70a99075ab97a84a63b3b9b0d9d86071031c3fccc551a975070c (d8d3a421732f3b88a26f0796034e739df68b0725)
- config.json +52 -0
- generation_config.json +12 -0
- model-00001-of-00034.safetensors +3 -0
- model-00002-of-00034.safetensors +3 -0
- model-00003-of-00034.safetensors +3 -0
- model-00004-of-00034.safetensors +3 -0
- model-00005-of-00034.safetensors +3 -0
- model-00006-of-00034.safetensors +3 -0
- model-00007-of-00034.safetensors +3 -0
- model-00008-of-00034.safetensors +3 -0
- model-00009-of-00034.safetensors +3 -0
- model-00010-of-00034.safetensors +3 -0
- model-00011-of-00034.safetensors +3 -0
- model-00012-of-00034.safetensors +3 -0
- model-00013-of-00034.safetensors +3 -0
- model-00014-of-00034.safetensors +3 -0
- model-00015-of-00034.safetensors +3 -0
- model-00016-of-00034.safetensors +3 -0
- model-00017-of-00034.safetensors +3 -0
- model-00018-of-00034.safetensors +3 -0
- model-00019-of-00034.safetensors +3 -0
- model-00020-of-00034.safetensors +3 -0
- model-00021-of-00034.safetensors +3 -0
- model-00022-of-00034.safetensors +3 -0
- model-00023-of-00034.safetensors +3 -0
- model-00024-of-00034.safetensors +3 -0
- model-00025-of-00034.safetensors +3 -0
- model-00026-of-00034.safetensors +3 -0
- model-00027-of-00034.safetensors +3 -0
- model-00028-of-00034.safetensors +3 -0
- model-00029-of-00034.safetensors +3 -0
- model-00030-of-00034.safetensors +3 -0
- model-00031-of-00034.safetensors +3 -0
- model-00032-of-00034.safetensors +3 -0
- model-00033-of-00034.safetensors +3 -0
- model-00034-of-00034.safetensors +3 -0
- model.safetensors.index.json +0 -0
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "meta-llama/Meta-Llama-3.1-405B-Instruct",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": [
|
10 |
+
128001,
|
11 |
+
128008,
|
12 |
+
128009
|
13 |
+
],
|
14 |
+
"head_dim": 128,
|
15 |
+
"hidden_act": "silu",
|
16 |
+
"hidden_size": 16384,
|
17 |
+
"initializer_range": 0.02,
|
18 |
+
"intermediate_size": 53248,
|
19 |
+
"max_position_embeddings": 131072,
|
20 |
+
"mlp_bias": false,
|
21 |
+
"model_type": "llama",
|
22 |
+
"num_attention_heads": 128,
|
23 |
+
"num_hidden_layers": 126,
|
24 |
+
"num_key_value_heads": 8,
|
25 |
+
"pretraining_tp": 1,
|
26 |
+
"quip_params": {
|
27 |
+
"K": 3,
|
28 |
+
"L": 16,
|
29 |
+
"V": 2,
|
30 |
+
"codebook": "bitshift",
|
31 |
+
"codebook_version": 0,
|
32 |
+
"decode_mode": "quantlut_sym",
|
33 |
+
"split_for_tp": true,
|
34 |
+
"td_x": 16,
|
35 |
+
"td_y": 16,
|
36 |
+
"tlut_bits": 9
|
37 |
+
},
|
38 |
+
"rms_norm_eps": 1e-05,
|
39 |
+
"rope_scaling": {
|
40 |
+
"factor": 8.0,
|
41 |
+
"high_freq_factor": 4.0,
|
42 |
+
"low_freq_factor": 1.0,
|
43 |
+
"original_max_position_embeddings": 8192,
|
44 |
+
"rope_type": "llama3"
|
45 |
+
},
|
46 |
+
"rope_theta": 500000.0,
|
47 |
+
"tie_word_embeddings": false,
|
48 |
+
"torch_dtype": "bfloat16",
|
49 |
+
"transformers_version": "4.45.2",
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 128256
|
52 |
+
}
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 128000,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
128001,
|
6 |
+
128008,
|
7 |
+
128009
|
8 |
+
],
|
9 |
+
"temperature": 0.6,
|
10 |
+
"top_p": 0.9,
|
11 |
+
"transformers_version": "4.45.2"
|
12 |
+
}
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8c917dcdc276eb70bef2a46721a83091ab551eeb291e99d340eeffecf50991f
|
3 |
+
size 4744289776
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7eb1c945146f52f2a15f92fffbd6f90bf32b59e26a9a638e7af3362e40a0226b
|
3 |
+
size 4785579736
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60a61ea38e7fa7c3314e6f33e9cd2220cb080d74f83aa0f4b811d4672d7945e2
|
3 |
+
size 4785579736
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e9b96bf2f7cdb3bf51d2f7337dd411afcf8a5b599dc48b4a7485acf0854d493
|
3 |
+
size 4785579856
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31626c1a285a6dcea890f28e9478b58553366b6cf1480be2f43a8780721f6f9d
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3211aeaa1d51cfc2973d1f574f9b2126f7fd3b4bab1f6ed353193fa855483775
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2e2978ad58ecad35f0ab5ae2c39fa927af193ff9b310ef681fa41cf98a62aa3
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87cc6f4c7aaa6e8a491c963447d6f4c545340bb09535b1fbcb547cfd6b54433f
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f703f14dd352af3a2f7a8c0c92150c8b93b9226d0ed2267f223c69ca2bd1ff5
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:998c305d6a53f753f28233f18124c28466c73549f795a72c85ee5c85939739cf
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f503cb69f9f615284bb794df883348c5252c03d87a1a588459bb411e215345b
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c73b2a88e4ebabcc9a29f61226b88e677b9f6bbe5f8360d7243efc350b56c49
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ee7ff77231860d33d1542655234ef5240dfb4f7a1cdf54a61a97b633db6e801
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:703eee83cf6e33e31db9ef2b1d55348b0e0b944d565b8fd0ac7f859242b5db8a
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed8dc51f9c90d9fc69e450ac038f0763428b74bf2366d046e751282e11728e5c
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4775acc45a96a543dc546c301dab8bce0743e89f4d19a2a0cb05306711ee2a7c
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77e111583abfabd070838b602353e0508182b411a29bd48654fa9597db4065ce
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1310b13685ea71f4f1a44818320d874bae5a0871bf569f3c2e1d9e4fe3907040
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72abe511a4033935b7f0587143ff2dba6517aadcdb37e4ff4bb689fcda0c228a
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa823cf5a40880bcbeba39b8ff37d62354bf4df77629a65ed15e6f25a29f9b04
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab52dab01cbb0ec1398698248eedc70b1f2278d2942ee3806a08c990d03a241a
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06418c6c667ca4445ecb4cf0da244b368e2b38556929a0d7dd9e7c569c00a5f6
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3fa229890d1788ebd3668c967d08e9db7038f6f77e88dc1f17a5b72e6451ec8
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e24c1841c1197c86117b8caf5c0544bb4b59234331efb0e568ea6ef3bac24aa
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17bb9c81382b39a1bdda7e37f3147691f5480f757b1d68483a2842518d84d629
|
3 |
+
size 4785579912
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3904590a62f7b31969d940aa5de38a35f0c2e8573a9983bcf46d487ade5a597
|
3 |
+
size 4785579936
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c65d60592f907f6afc6c1cb2a762e1f6f7b678e2a728bfef53dee0028e994e2
|
3 |
+
size 4785580088
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e530a4ae5bfb460c3bdff294c35da19bb7f4e39ffd34937e536565b3b7ebc4c
|
3 |
+
size 4785580088
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ace55e9768cafa03a400beefcda03ff661088d8fa8e68004eb30660389214ff8
|
3 |
+
size 4785580088
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:919f8be272b4625ad871ef6f2698bf4fc19229a50ffe3d10f39f0eef3503d5ec
|
3 |
+
size 4785580088
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3691afc5db7eb1489d5561593953ae1959504b2e7f92cde9bef817d1f7af30f
|
3 |
+
size 4785580088
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f1b2df01c3638054194742dfc4cecdf58049afa72b84a00d0e65d3023239e65
|
3 |
+
size 4785580088
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2e52c41500676ca8a00a1910e6341bbdcadb6eb15fc5fc36adb653758d2b0e4
|
3 |
+
size 1851225824
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71b079a02069ebe5a5f4f8135815f136afb1d6fc4423620dcb2a14fa399cdf12
|
3 |
+
size 4202692736
|
The diff for this file is too large to render.
See raw diff
|
|