at676 committed on
Commit
92fde07
1 Parent(s): d23e6ed

Upload folder using huggingface_hub (#2)

Browse files

- 8e2190dcd8ca77f4ec090bd042aaa3b9b28e7796f03531aba822d65d59440768 (dfc5f05d301e83c7bbccc034c34e2f879755822a)
- 13ce69aa8ff27b301054dc63cd75b90fda003fbfffaacddc83acb215c35da96a (686499b990fb417ff0996c2852566a1552eb33d6)
- 10357b0f603e5be2bd7054b25e31c9d52f52e135bbf340fbb02e61aa748abc39 (b305f5f17251160f5a03d582ca40b26c06ee85e6)
- 8019eab46b499fa66999ba0139ed53be05872a284bb5db33d1fad28f8e06f05b (bbe9acd713983e16bbee96e9c3829c2ad5ef66f8)
- c24fa0ffac45a5e59f322e40a797caa54c62e38b95e2d9abe69ecf0c0738dd23 (35561fda28d97ef7ffedcc99fc5790626937b9b5)
- 1691e233b5cf9768d0124f3a1f2b00881e59c0a212708f4a5a7db8d7932bba16 (c745d526476c6a865abf0324e3991f879939f638)
- 350244a54f2a7cc3f5a6f753fbed219dba08ff6bcf11bd9b7ea905fd295c8cd7 (7f78449b7e8161404e736852933602dae7f25d70)
- 127f9ada11c5f6302756858661324c42b018885570c6fb1306c49a378df133a9 (96d5c7be245c6ada6bc05852c4a8adf2158cc12f)
- a42e2c0b97d017b2376c504eabd5dd0812ccebbb33aecd45b718edfa9e2d5e09 (2bf86f620389d2cc3c9f4afbef0a67b94730119a)
- b9705dfcf9230e248a5d270cd852d101d15f9c12d035d2dce841a68c582a1ecf (b2f315dd59d212c9b64af639c20780a3b5a47fd3)
- 53857526e30b6ca40400d5859bc2c5bdfc6bc76bebffb0030eda168210195633 (bcfdf49a83af13e48156f601bf3e09752f083c52)
- cc3e37235a3d0bbfbdbe30c89e2000551bb6df66755ba3d5a58e803be4c12f8f (aee456d60c2e297e97b690399d82ac6520da9d41)
- 77beb9534ac061baf7c9529b90a44d34511404cad404a35cd5ad1e9d4248facc (75345a9189a04c8aac4d278e005dc5c41e48325f)
- 82483d9661d58d4d1852e79ccc52b4ec47a77b64ee2c7debb0ae1bf163aa003f (0f70fafa18920204c1c30416d9e0730c45292b57)
- 39ec7dbee6304b376613e44d7c103f6cd107ddb83ea207b51708af9200b36eb0 (7173458e0b9e3029b00a39623101002f3934ee99)
- 5b4c6d009aeac4cb5821c080ad2d0c17d2a412e4474cf167832951c9fa70208e (7ed864b61e0b0fd024badc3aaa51ec98ca2f5c47)
- 93726c91f7804da607f1a57f24e4a6c5d7225cee6c5bc1c61892451637541de9 (4341ebe2427e8d1c6aae6a6668abb0d4275d171f)
- 275c401e04d35144d291c0ac660ccba3b820193c066ce86394e49a84f054d9b2 (653b74c43aec9186b2a10879ac56bd1084c33165)
- e2d7fd59fc8f84a52a77a93c975b7135d1b69a3145874880abd0cdd85f1f8041 (6103180376025eb078d323736495743e713e70c0)
- 52a7d7936a8aaf9c72558fbbcc44e6508166176b3828e1fbb266e91d4e4772e5 (6467b123bc3c3a4b2201afae467b99ac6ed4b62a)
- 0bb9d8f81c430bfa3663c31ebaf875d0c5abde9a07e8597ddf526fbf3cb4457d (1b430c28d6eb43392203d3d14673015b9d6e5c5a)
- b1d216d3af51b5acd6906a197b4492169682a37d18f79dcce2752f2386eea92d (93b5c95aa43cd6108b156ef193ed2b70f4ae76a0)
- 61e36debba634af1130dd4cdda2adf6d5dae189ba2897f2ad4a4ac5f82d31d02 (01f49b96b1b908216b3a39c5fc90e9cda3a6ef4a)
- 2a26697cf22812930c46865659cb1f7e6ccb59274bd339a21af9b50fd6eddca5 (31be7ecc46c3bc7d1836f04a0dfb8e90d78a49e7)
- 234f48105908d805877a5f4515e0c4040b0a0a5668b904dce77629fbaf410dab (93f3931c81c22fe7baf4bae59ca55883c7a118f5)
- 3ad5a08ff36044b70ce9fa962d78c465c2df540eb2ea90e951480f77a1de0c23 (59bf3d8727d2e8e232dec3806c87bc2a712ae9ba)
- 7f0655a17ad0af7d161872887ae2820288adad285cfc692dda44a83f75dd62c4 (23b5632f7f62c7bff6e9883baca7530c49e29ebc)
- 98950f0bfc1291c5a02625607cdae5f89c17c53e9ab9a26c94f03adafbffe716 (e935af5dfb5975fcfaac9fc11714d340d4623237)
- 0e753ca875559ed03d609960aedc452dec500b6bcadefc5fd7025f79bc90b16c (fa4bf428f5856650e0a79b86e0863b47d77cc9ca)
- b93d8a7b0601238a09e597123a9d6e94f6c50d0aa30f0340ec8b45d1a5a364ad (0987ef1a40e09ca797c81b3d7ce4a77fcbdbbd1b)
- bdbc3d0298e45f2cd4f778fb4c99d339a4c3b8a0035f54411e7f527d26d6678d (e146f5d60220119aeb5a31b79e58ce4ce0da199e)
- c47d220cefdfe2981241cc4b6aad7b8e40fabc2d33d2992688148b25cf3dde5e (6e25b52ad402a5dd3f4523b7b99901f0237428e9)
- c6b6de80a11cf4403f54326d3971e046628487fc0e336b52bc44799a19522abd (4bbad7a3a7cc3662e14354daba328d86f7e24514)
- ccce89e942af70a99075ab97a84a63b3b9b0d9d86071031c3fccc551a975070c (d8d3a421732f3b88a26f0796034e739df68b0725)

config.json ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "meta-llama/Meta-Llama-3.1-405B-Instruct",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 128000,
9
+ "eos_token_id": [
10
+ 128001,
11
+ 128008,
12
+ 128009
13
+ ],
14
+ "head_dim": 128,
15
+ "hidden_act": "silu",
16
+ "hidden_size": 16384,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 53248,
19
+ "max_position_embeddings": 131072,
20
+ "mlp_bias": false,
21
+ "model_type": "llama",
22
+ "num_attention_heads": 128,
23
+ "num_hidden_layers": 126,
24
+ "num_key_value_heads": 8,
25
+ "pretraining_tp": 1,
26
+ "quip_params": {
27
+ "K": 3,
28
+ "L": 16,
29
+ "V": 2,
30
+ "codebook": "bitshift",
31
+ "codebook_version": 0,
32
+ "decode_mode": "quantlut_sym",
33
+ "split_for_tp": true,
34
+ "td_x": 16,
35
+ "td_y": 16,
36
+ "tlut_bits": 9
37
+ },
38
+ "rms_norm_eps": 1e-05,
39
+ "rope_scaling": {
40
+ "factor": 8.0,
41
+ "high_freq_factor": 4.0,
42
+ "low_freq_factor": 1.0,
43
+ "original_max_position_embeddings": 8192,
44
+ "rope_type": "llama3"
45
+ },
46
+ "rope_theta": 500000.0,
47
+ "tie_word_embeddings": false,
48
+ "torch_dtype": "bfloat16",
49
+ "transformers_version": "4.45.2",
50
+ "use_cache": true,
51
+ "vocab_size": 128256
52
+ }
generation_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 128000,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 128001,
6
+ 128008,
7
+ 128009
8
+ ],
9
+ "temperature": 0.6,
10
+ "top_p": 0.9,
11
+ "transformers_version": "4.45.2"
12
+ }
model-00001-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8c917dcdc276eb70bef2a46721a83091ab551eeb291e99d340eeffecf50991f
3
+ size 4744289776
model-00002-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7eb1c945146f52f2a15f92fffbd6f90bf32b59e26a9a638e7af3362e40a0226b
3
+ size 4785579736
model-00003-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60a61ea38e7fa7c3314e6f33e9cd2220cb080d74f83aa0f4b811d4672d7945e2
3
+ size 4785579736
model-00004-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e9b96bf2f7cdb3bf51d2f7337dd411afcf8a5b599dc48b4a7485acf0854d493
3
+ size 4785579856
model-00005-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31626c1a285a6dcea890f28e9478b58553366b6cf1480be2f43a8780721f6f9d
3
+ size 4785579912
model-00006-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3211aeaa1d51cfc2973d1f574f9b2126f7fd3b4bab1f6ed353193fa855483775
3
+ size 4785579912
model-00007-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2e2978ad58ecad35f0ab5ae2c39fa927af193ff9b310ef681fa41cf98a62aa3
3
+ size 4785579912
model-00008-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87cc6f4c7aaa6e8a491c963447d6f4c545340bb09535b1fbcb547cfd6b54433f
3
+ size 4785579912
model-00009-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f703f14dd352af3a2f7a8c0c92150c8b93b9226d0ed2267f223c69ca2bd1ff5
3
+ size 4785579912
model-00010-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:998c305d6a53f753f28233f18124c28466c73549f795a72c85ee5c85939739cf
3
+ size 4785579912
model-00011-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f503cb69f9f615284bb794df883348c5252c03d87a1a588459bb411e215345b
3
+ size 4785579912
model-00012-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c73b2a88e4ebabcc9a29f61226b88e677b9f6bbe5f8360d7243efc350b56c49
3
+ size 4785579912
model-00013-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ee7ff77231860d33d1542655234ef5240dfb4f7a1cdf54a61a97b633db6e801
3
+ size 4785579912
model-00014-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:703eee83cf6e33e31db9ef2b1d55348b0e0b944d565b8fd0ac7f859242b5db8a
3
+ size 4785579912
model-00015-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed8dc51f9c90d9fc69e450ac038f0763428b74bf2366d046e751282e11728e5c
3
+ size 4785579912
model-00016-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4775acc45a96a543dc546c301dab8bce0743e89f4d19a2a0cb05306711ee2a7c
3
+ size 4785579912
model-00017-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77e111583abfabd070838b602353e0508182b411a29bd48654fa9597db4065ce
3
+ size 4785579912
model-00018-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1310b13685ea71f4f1a44818320d874bae5a0871bf569f3c2e1d9e4fe3907040
3
+ size 4785579912
model-00019-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72abe511a4033935b7f0587143ff2dba6517aadcdb37e4ff4bb689fcda0c228a
3
+ size 4785579912
model-00020-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa823cf5a40880bcbeba39b8ff37d62354bf4df77629a65ed15e6f25a29f9b04
3
+ size 4785579912
model-00021-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab52dab01cbb0ec1398698248eedc70b1f2278d2942ee3806a08c990d03a241a
3
+ size 4785579912
model-00022-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06418c6c667ca4445ecb4cf0da244b368e2b38556929a0d7dd9e7c569c00a5f6
3
+ size 4785579912
model-00023-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3fa229890d1788ebd3668c967d08e9db7038f6f77e88dc1f17a5b72e6451ec8
3
+ size 4785579912
model-00024-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e24c1841c1197c86117b8caf5c0544bb4b59234331efb0e568ea6ef3bac24aa
3
+ size 4785579912
model-00025-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17bb9c81382b39a1bdda7e37f3147691f5480f757b1d68483a2842518d84d629
3
+ size 4785579912
model-00026-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3904590a62f7b31969d940aa5de38a35f0c2e8573a9983bcf46d487ade5a597
3
+ size 4785579936
model-00027-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c65d60592f907f6afc6c1cb2a762e1f6f7b678e2a728bfef53dee0028e994e2
3
+ size 4785580088
model-00028-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e530a4ae5bfb460c3bdff294c35da19bb7f4e39ffd34937e536565b3b7ebc4c
3
+ size 4785580088
model-00029-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ace55e9768cafa03a400beefcda03ff661088d8fa8e68004eb30660389214ff8
3
+ size 4785580088
model-00030-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:919f8be272b4625ad871ef6f2698bf4fc19229a50ffe3d10f39f0eef3503d5ec
3
+ size 4785580088
model-00031-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3691afc5db7eb1489d5561593953ae1959504b2e7f92cde9bef817d1f7af30f
3
+ size 4785580088
model-00032-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f1b2df01c3638054194742dfc4cecdf58049afa72b84a00d0e65d3023239e65
3
+ size 4785580088
model-00033-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2e52c41500676ca8a00a1910e6341bbdcadb6eb15fc5fc36adb653758d2b0e4
3
+ size 1851225824
model-00034-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71b079a02069ebe5a5f4f8135815f136afb1d6fc4423620dcb2a14fa399cdf12
3
+ size 4202692736
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff