Upload folder using huggingface_hub

#2
Files changed (47) hide show
  1. config.json +52 -0
  2. generation_config.json +12 -0
  3. model-00001-of-00044.safetensors +3 -0
  4. model-00002-of-00044.safetensors +3 -0
  5. model-00003-of-00044.safetensors +3 -0
  6. model-00004-of-00044.safetensors +3 -0
  7. model-00005-of-00044.safetensors +3 -0
  8. model-00006-of-00044.safetensors +3 -0
  9. model-00007-of-00044.safetensors +3 -0
  10. model-00008-of-00044.safetensors +3 -0
  11. model-00009-of-00044.safetensors +3 -0
  12. model-00010-of-00044.safetensors +3 -0
  13. model-00011-of-00044.safetensors +3 -0
  14. model-00012-of-00044.safetensors +3 -0
  15. model-00013-of-00044.safetensors +3 -0
  16. model-00014-of-00044.safetensors +3 -0
  17. model-00015-of-00044.safetensors +3 -0
  18. model-00016-of-00044.safetensors +3 -0
  19. model-00017-of-00044.safetensors +3 -0
  20. model-00018-of-00044.safetensors +3 -0
  21. model-00019-of-00044.safetensors +3 -0
  22. model-00020-of-00044.safetensors +3 -0
  23. model-00021-of-00044.safetensors +3 -0
  24. model-00022-of-00044.safetensors +3 -0
  25. model-00023-of-00044.safetensors +3 -0
  26. model-00024-of-00044.safetensors +3 -0
  27. model-00025-of-00044.safetensors +3 -0
  28. model-00026-of-00044.safetensors +3 -0
  29. model-00027-of-00044.safetensors +3 -0
  30. model-00028-of-00044.safetensors +3 -0
  31. model-00029-of-00044.safetensors +3 -0
  32. model-00030-of-00044.safetensors +3 -0
  33. model-00031-of-00044.safetensors +3 -0
  34. model-00032-of-00044.safetensors +3 -0
  35. model-00033-of-00044.safetensors +3 -0
  36. model-00034-of-00044.safetensors +3 -0
  37. model-00035-of-00044.safetensors +3 -0
  38. model-00036-of-00044.safetensors +3 -0
  39. model-00037-of-00044.safetensors +3 -0
  40. model-00038-of-00044.safetensors +3 -0
  41. model-00039-of-00044.safetensors +3 -0
  42. model-00040-of-00044.safetensors +3 -0
  43. model-00041-of-00044.safetensors +3 -0
  44. model-00042-of-00044.safetensors +3 -0
  45. model-00043-of-00044.safetensors +3 -0
  46. model-00044-of-00044.safetensors +3 -0
  47. model.safetensors.index.json +0 -0
config.json ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "meta-llama/Meta-Llama-3.1-405B-Instruct",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 128000,
9
+ "eos_token_id": [
10
+ 128001,
11
+ 128008,
12
+ 128009
13
+ ],
14
+ "head_dim": 128,
15
+ "hidden_act": "silu",
16
+ "hidden_size": 16384,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 53248,
19
+ "max_position_embeddings": 131072,
20
+ "mlp_bias": false,
21
+ "model_type": "llama",
22
+ "num_attention_heads": 128,
23
+ "num_hidden_layers": 126,
24
+ "num_key_value_heads": 8,
25
+ "pretraining_tp": 1,
26
+ "quip_params": {
27
+ "K": 4,
28
+ "L": 16,
29
+ "V": 2,
30
+ "codebook": "bitshift",
31
+ "codebook_version": 0,
32
+ "decode_mode": "quantlut_sym",
33
+ "split_for_tp": true,
34
+ "td_x": 16,
35
+ "td_y": 16,
36
+ "tlut_bits": 9
37
+ },
38
+ "rms_norm_eps": 1e-05,
39
+ "rope_scaling": {
40
+ "factor": 8.0,
41
+ "high_freq_factor": 4.0,
42
+ "low_freq_factor": 1.0,
43
+ "original_max_position_embeddings": 8192,
44
+ "rope_type": "llama3"
45
+ },
46
+ "rope_theta": 500000.0,
47
+ "tie_word_embeddings": false,
48
+ "torch_dtype": "bfloat16",
49
+ "transformers_version": "4.45.2",
50
+ "use_cache": true,
51
+ "vocab_size": 128256
52
+ }
generation_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 128000,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 128001,
6
+ 128008,
7
+ 128009
8
+ ],
9
+ "temperature": 0.6,
10
+ "top_p": 0.9,
11
+ "transformers_version": "4.45.2"
12
+ }
model-00001-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb853e920c912c15bb8ab443fa85a3b576df35fc8e8a4de0bf5d2239d7356295
3
+ size 4924644256
model-00002-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dd0f7a7f2455adff7ea0a639731150448552665f140e15ce917ffcaa647ce0b
3
+ size 4784559328
model-00003-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:734df5954bca402b4d78aaadb45838c93d92e7c38f6dab699013419e6623aec7
3
+ size 4784559328
model-00004-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59b067068fe8f0901c5c90e40e157625e4b25fa1d09676c067200e0d88da2889
3
+ size 4784559328
model-00005-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cce82a14e1d994c2de72614bbd140d1518b7ca70f4826d148d090499b36c134
3
+ size 4784559432
model-00006-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0650eaeb15263f425d02d2e90282adc9aac9c7f095bfd45892dbf7dbd47d48b6
3
+ size 4784559440
model-00007-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e6de5b0ecabcca7cac410b54c34344f10a0893380e444726d4be33cbd7c25b5
3
+ size 4784559440
model-00008-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2349d4beb027962816aa8ed1db56f02050ec7a57c48688241a68b1125ce6f14
3
+ size 4784559440
model-00009-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bc923acb7a2c379d906fb0c741be85403547408ad7093b0618e0171d61592a4
3
+ size 4784559440
model-00010-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:715d75d8fd437a626351a74b8b792d87bf2be2f63acb9486ea14eb0258844f04
3
+ size 4784559440
model-00011-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45f55b3fb4506c09c5584897129659a1af467bae772804e5e8686f9ff8a29194
3
+ size 4784559440
model-00012-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:070ac6ba6038eaddf3566e13f6d87c13abb1530ddcfe09f4ef47718cabb75c56
3
+ size 4784559440
model-00013-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:199062beeecc7eac2672ca19385c44c8516fd9ec8752e8bd58c8df1fe61992f4
3
+ size 4784559440
model-00014-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:320feefcda9ee6bbf7843567787b8e2187a62c50d81c12a53260bebe9e8de3f6
3
+ size 4784559440
model-00015-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29a8715edfd24f0ef757c88578d0317a8a012f2c40a88bfdc13c51792571fe32
3
+ size 4784559440
model-00016-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f28d9e69c7274e5d9c1ef4cb6109084780427db518e6364c680e8e64ff063780
3
+ size 4784559440
model-00017-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10d8706fcc5536b4ee298b756b820385882e8029d00812e9fa9a509561bddf40
3
+ size 4784559440
model-00018-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80a71d23a392c7c51c80f5790ba04326fff05311e77ced5dfb1fa7d5721b15a5
3
+ size 4784559440
model-00019-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06384a4bba1a5037dc9edae615ab8182b6f1b2be54a810e2e7eaa1381557489e
3
+ size 4784559440
model-00020-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:030313ca91deb44a17e47cfd97606767d0ec55982aef63d9b4ba19517e6385ad
3
+ size 4784559440
model-00021-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5275cef1047bccb0fdc882b6752a32aa2f3c26b6427d4b92c13e1e6e83b1e385
3
+ size 4784559440
model-00022-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddaed62e5aa9ddba18b8923663d46c83153431fe8d5883b2e97609c3aad750ee
3
+ size 4784559440
model-00023-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d85ea44149d6f535a11093f850cb0b4e5d2babc1e12c51e333c2e3ba7e0bc52
3
+ size 4784559440
model-00024-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:534e1d00b14eeac998844d24174bebbd3ee22ed8c1a02d77502dcb6aba77b9c7
3
+ size 4784559440
model-00025-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f312d4c84e05e7c4061f000fabdab1eb66f0e0ccc80173cf092ea993560fa75
3
+ size 4784559440
model-00026-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab8eb73f87d7ec1c8ee92140cf1f479aa2ae02d48016fdc6f11ae8149266bf6a
3
+ size 4784559440
model-00027-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbb8c10de4ba138cb5b75ab1c9178688e0c9dc016bd57446830682e5231f70e3
3
+ size 4784559440
model-00028-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e63e4952f613ae073b5aba84cb0b667df1060d3a257bd3bad674e2cbb763cf06
3
+ size 4784559440
model-00029-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42ddeaddec8bb34d79b0d037eeb58fc198b38911216f08ad94c2bbab328b1844
3
+ size 4784559440
model-00030-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d55738921485b99e0ba422f18263b3b16fb246fa830e38acd609b4e6a39237bb
3
+ size 4784559440
model-00031-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1eb091533a64700e483ca482a9b7a2a196f798fb96ad034054ddf94e8b15035
3
+ size 4784559440
model-00032-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d061e15a2104288a8cdd6c79043815c9a19f110002a1b4147c667230eb73dbd6
3
+ size 4784559440
model-00033-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d97a2a798b8854d202aab917e9e599f4152f69da0ef066f691a541bad5f607fb
3
+ size 4784559440
model-00034-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3db508eea5c86933fcc36f64eaf8ce48ab09b7a91e96985bd2c350fe3515a509
3
+ size 4784559440
model-00035-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:978eadb283a16c0f09de96855cdcc1cb699432d9cdd6842bfa32c1a4ec3e080b
3
+ size 4784559544
model-00036-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:598baee728eb850230af4ceec480bd016727a927c84ce0372454a37b4979e65a
3
+ size 4784559552
model-00037-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2861f7c4ecbab987c1b6223c88f769f825be950653f1aeac183366ab7b3574a7
3
+ size 4784559552
model-00038-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a14300eab5e140f012c8430e7268077174bdc5f64786fc3574bdf0fa58519425
3
+ size 4784559552
model-00039-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c167a62089f3d8846f6e5f2d8a6aebe0c4d88911d1b3877ae860e73022060c1d
3
+ size 4784559552
model-00040-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2396809fffd0accaac360308ccbf1facd2d587b3fe93f15f84a63b0cff5b2e2f
3
+ size 4784559552
model-00041-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cdae08a1ae3b7ef15aa1ebfdd22fc7faafabd18366b110a92d9dc73cf2466c0
3
+ size 4784559552
model-00042-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8266584f0dbec606b412e7b52bb7d27c2d65352dde1b6b24b64dd617b773648
3
+ size 4784559552
model-00043-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00736c83503d93a500a8df46e93d657b5a3154c5812fe58314e8d218dedf53ad
3
+ size 4062640880
model-00044-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71b079a02069ebe5a5f4f8135815f136afb1d6fc4423620dcb2a14fa399cdf12
3
+ size 4202692736
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff