monology committed on
Commit
c7af9ee
1 Parent(s): 83dd214

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. README.md +40 -0
  2. config.json +29 -0
  3. mergekit_config.yml +24 -0
  4. model-00001-of-00070.safetensors +3 -0
  5. model-00002-of-00070.safetensors +3 -0
  6. model-00003-of-00070.safetensors +3 -0
  7. model-00004-of-00070.safetensors +3 -0
  8. model-00005-of-00070.safetensors +3 -0
  9. model-00006-of-00070.safetensors +3 -0
  10. model-00007-of-00070.safetensors +3 -0
  11. model-00008-of-00070.safetensors +3 -0
  12. model-00009-of-00070.safetensors +3 -0
  13. model-00010-of-00070.safetensors +3 -0
  14. model-00011-of-00070.safetensors +3 -0
  15. model-00012-of-00070.safetensors +3 -0
  16. model-00013-of-00070.safetensors +3 -0
  17. model-00014-of-00070.safetensors +3 -0
  18. model-00015-of-00070.safetensors +3 -0
  19. model-00016-of-00070.safetensors +3 -0
  20. model-00017-of-00070.safetensors +3 -0
  21. model-00018-of-00070.safetensors +3 -0
  22. model-00019-of-00070.safetensors +3 -0
  23. model-00020-of-00070.safetensors +3 -0
  24. model-00021-of-00070.safetensors +3 -0
  25. model-00022-of-00070.safetensors +3 -0
  26. model-00023-of-00070.safetensors +3 -0
  27. model-00024-of-00070.safetensors +3 -0
  28. model-00025-of-00070.safetensors +3 -0
  29. model-00026-of-00070.safetensors +3 -0
  30. model-00027-of-00070.safetensors +3 -0
  31. model-00028-of-00070.safetensors +3 -0
  32. model-00029-of-00070.safetensors +3 -0
  33. model-00030-of-00070.safetensors +3 -0
  34. model-00031-of-00070.safetensors +3 -0
  35. model-00032-of-00070.safetensors +3 -0
  36. model-00033-of-00070.safetensors +3 -0
  37. model-00034-of-00070.safetensors +3 -0
  38. model-00035-of-00070.safetensors +3 -0
  39. model-00036-of-00070.safetensors +3 -0
  40. model-00037-of-00070.safetensors +3 -0
  41. model-00038-of-00070.safetensors +3 -0
  42. model-00039-of-00070.safetensors +3 -0
  43. model-00040-of-00070.safetensors +3 -0
  44. model-00041-of-00070.safetensors +3 -0
  45. model-00042-of-00070.safetensors +3 -0
  46. model-00043-of-00070.safetensors +3 -0
  47. model-00044-of-00070.safetensors +3 -0
  48. model-00045-of-00070.safetensors +3 -0
  49. model-00046-of-00070.safetensors +3 -0
  50. model-00047-of-00070.safetensors +3 -0
README.md CHANGED
@@ -1,3 +1,43 @@
1
  ---
 
 
 
 
 
 
2
  license: apache-2.0
3
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
+ base_model:
3
+ - tiiuae/falcon-180B
4
+ library_name: transformers
5
+ tags:
6
+ - mergekit
7
+ - merge
8
  license: apache-2.0
9
  ---
10
+ # largefalcon
11
+
12
+ This is a frankenmerge of [tiiuae/falcon-180B](https://huggingface.co/tiiuae/falcon-180B) created using [mergekit](https://github.com/cg123/mergekit).
13
+
14
+ ## Merge Details
15
+
16
+ The following YAML configuration was used to produce this model:
17
+
18
+ ```yaml
19
+ dtype: float16
20
+ merge_method: passthrough
21
+ slices:
22
+ - sources:
23
+   - layer_range: [0, 20]
24
+     model: tiiuae/falcon-180B
25
+ - sources:
26
+   - layer_range: [10, 30]
27
+     model: tiiuae/falcon-180B
28
+ - sources:
29
+   - layer_range: [20, 40]
30
+     model: tiiuae/falcon-180B
31
+ - sources:
32
+   - layer_range: [30, 50]
33
+     model: tiiuae/falcon-180B
34
+ - sources:
35
+   - layer_range: [40, 60]
36
+     model: tiiuae/falcon-180B
37
+ - sources:
38
+   - layer_range: [50, 70]
39
+     model: tiiuae/falcon-180B
40
+ - sources:
41
+   - layer_range: [60, 80]
42
+     model: tiiuae/falcon-180B
43
+ ```
config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "tiiuae/falcon-180B",
3
+ "alibi": false,
4
+ "architectures": [
5
+ "FalconForCausalLM"
6
+ ],
7
+ "attention_dropout": 0.0,
8
+ "bias": false,
9
+ "bos_token_id": 11,
10
+ "eos_token_id": 11,
11
+ "hidden_dropout": 0.0,
12
+ "hidden_size": 14848,
13
+ "initializer_range": 0.02,
14
+ "layer_norm_epsilon": 1e-05,
15
+ "max_position_embeddings": 2048,
16
+ "model_type": "falcon",
17
+ "multi_query": true,
18
+ "new_decoder_architecture": true,
19
+ "num_attention_heads": 232,
20
+ "num_hidden_layers": 140,
21
+ "num_kv_heads": 8,
22
+ "parallel_attn": true,
23
+ "rope_scaling": null,
24
+ "rope_theta": 10000.0,
25
+ "torch_dtype": "float16",
26
+ "transformers_version": "4.39.1",
27
+ "use_cache": true,
28
+ "vocab_size": 65024
29
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dtype: float16
2
+ merge_method: passthrough
3
+ slices:
4
+ - sources:
5
+   - layer_range: [0, 20]
6
+     model: tiiuae/falcon-180B
7
+ - sources:
8
+   - layer_range: [10, 30]
9
+     model: tiiuae/falcon-180B
10
+ - sources:
11
+   - layer_range: [20, 40]
12
+     model: tiiuae/falcon-180B
13
+ - sources:
14
+   - layer_range: [30, 50]
15
+     model: tiiuae/falcon-180B
16
+ - sources:
17
+   - layer_range: [40, 60]
18
+     model: tiiuae/falcon-180B
19
+ - sources:
20
+   - layer_range: [50, 70]
21
+     model: tiiuae/falcon-180B
22
+ - sources:
23
+   - layer_range: [60, 80]
24
+     model: tiiuae/falcon-180B
model-00001-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56db71b2bc483ff840bb7841782e08671e61a3c495fec5f8be62002723f89e3d
3
+ size 9958970992
model-00002-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7d8a1ef64c83f3a1c09eecfae1e3b07596236d318d05a76f4e57d4f633cc0cf
3
+ size 8879580944
model-00003-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ed6b5b5950ee5188e908d6ffbdfed9eeb26f5f6a12d827d9ff5b7f0be95c883
3
+ size 8879580944
model-00004-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c50e4322e610f6e8bdfccc100701ed331891892800e6327687ac6f06087e774
3
+ size 8879580944
model-00005-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b43657438e6f9331c4ec7af0ff2a8ab890f0a9e0cac0e29647e3ab1ec7c1639f
3
+ size 9791842360
model-00006-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81906c631de85f5bd90497d289c5991b0e4870ebc63ca0481c66acae1faa136d
3
+ size 8879461792
model-00007-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93a56c31005fe90da953d79d9e3c881ba5dd2a973469b0fd86b377a146913419
3
+ size 8879580960
model-00008-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:738dbc36ae64dd25c2505e5f0f319128603a8a4d708f89ceacbb65b7705f0e67
3
+ size 8879580960
model-00009-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06047e561973a1ce2c27292e7fd6ce65517269a6de159d5a6bda55f0e6c3df97
3
+ size 8879580960
model-00010-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fc2a8ec74ded572d9c57e9ed3d74c6e9282b9e05384f96087afe9e02b4a7a58
3
+ size 8879580960
model-00011-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17e5c33cbc62fcda123bebac69d9eb5119e6cb639529bd162dacbd6a4ae2759d
3
+ size 8879580960
model-00012-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6abd5f1300ba418883726b7eebc161f656b2950f3fcae2683d75aa11a6526567
3
+ size 8879580960
model-00013-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a165ae6ae21c79d228f01109de80bf04d4db7655fa2aab6d27ec0247050cc436
3
+ size 8879580960
model-00014-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3030a4c27506c06a8c17a304345ff98e27f46a9003d941a75fdedfe930fb09bf
3
+ size 8879580960
model-00015-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f61b3c4b721404857adb782bc712b358b1126dd7d03ea2440f514706c35dc6ed
3
+ size 8879580960
model-00016-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5484f475630e36aff9c2a33a253aa6b0b98b66f35ce5909c09215442828e39b7
3
+ size 8879580960
model-00017-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ad98aee3bf96af6c074a33f86d5faa3e2edd1652fcdae9ef443a46d692b0e96
3
+ size 8879580960
model-00018-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7e853a3e1e201c52d16e5e6178be01ab3933401adcba54ddfedd15f1987b26c
3
+ size 8879580960
model-00019-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f415813972e7d25cc888d2a6ab277cb73ec633f981a3d44a8082e630fb73a02
3
+ size 8879580960
model-00020-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:789cb8040ed33b074be082bb7579a8746ca6e0b461dad197f59ef123fbeabea6
3
+ size 8879580960
model-00021-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d481b57e9df240aec5978a93e96c99cbd5a7d755e75a683a0d47179e48bf3d0e
3
+ size 8879580960
model-00022-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f42a36bf7481675f9abfdef53cca6e48983d392a019bc6b9c58fedbc61ccd1f0
3
+ size 8879580960
model-00023-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0939f6d7957426248c311f056a4e219e057b270ca380f647c1cdfcc127c5e2e
3
+ size 8879580960
model-00024-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccc2c289afdadb9a388394dcdc634459f55385a68dca4881878f61395ab40ccc
3
+ size 8879580960
model-00025-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ac50a4102c20f46fba798de4e4ebb390a8bbe1fa69af4f918654d26e1d21739
3
+ size 8879580960
model-00026-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c821714a0fd8aab515ff87fe4b42af906e3edb4b8c4320077c7360b9f47bca3
3
+ size 8879580960
model-00027-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf34a84f7f6d8b632aec2758923c5c2bdf29dfed6fa4afdaa4b50c2d53d1f2c8
3
+ size 8879580960
model-00028-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10ab8b1215bb520fd2532a47aa102d6a7be09d5c2d5b93fb9ec1df0c1aba0e50
3
+ size 8879580960
model-00029-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cd1ce0160d76c9bc890fafd01763fe05d24b963bac397a7beb4694158eaa874
3
+ size 8879580960
model-00030-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:208d231ec01599b75757c6abfa9e30072af42621e087926f8ba15a27f3c79ab2
3
+ size 8879580960
model-00031-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:234b24f9606609a4a57a8e900c41d317586be3b4a0be5b77e5c0e6f6bd4022a3
3
+ size 8879580960
model-00032-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0032e93b16e4c736756af8c5583b12c729f4bf59313dbfc493cbdab632ac8115
3
+ size 8879580960
model-00033-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74b9ad620d60f30f37d03e708ff4ccf4bd6652183dd9e8f11432d658ef0e5d5b
3
+ size 8879580960
model-00034-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0810c9059ce38526600d18570083da697b5c9f411923bdd4f7aedf013135208a
3
+ size 8879580960
model-00035-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ff772b30e036c04cdcb1d6ff8a2bb1a5612946c093a21738ebc65b999f6dc09
3
+ size 8879580960
model-00036-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a854d13a98b88979070c00fb0346c423c1e7ff72318e52b2105e87da3dc9c5cb
3
+ size 8879580960
model-00037-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:519b5d0782a8e56d9df69dcba8b74b2b057f3b23b63a424f4455f7024e70c77d
3
+ size 8879580960
model-00038-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c175fd5644abf6dc517b03cbc3675c625efbcb95cdbc68042f369ed68ada8fa4
3
+ size 8879580960
model-00039-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce0489c5c97a4e58eee89d896197a95f4a550995b4b48d8c8ef2a9c5e26359c2
3
+ size 8879580960
model-00040-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9087bf99dcdb05335158c7f26727f98315b4406ca3e41e07767999a678b5dd0c
3
+ size 8879580960
model-00041-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a51e5be2546b47e9e4b3496beceae686994790999ff0ea6d03124e04bb9a26f
3
+ size 8879580960
model-00042-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb69e67f02a32d7aaf81e0d177ec3fb176e5f064ee601e9758fdf619ba27ac63
3
+ size 8879580960
model-00043-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85d07c6beb8c7c5f5b792623aec2881f6d8e4367ad025d8ccba075e5e86c093c
3
+ size 8879580960
model-00044-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb6cfb28a4fc245574729b86f701e167a1219d8752cb6995b39e9415b9bef702
3
+ size 8879580960
model-00045-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:843c4285fc306611b39a8b29e332248869fdf5be64a4dd631ad2d625926beb21
3
+ size 8879581000
model-00046-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6360b21f2490f4edf6255f632bfd69fe75d28bb136167f656332965b8e2fd3de
3
+ size 8879581000
model-00047-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee14bd1208ac9afcb0d828f09e6650a437d80068a91fbb29b4d4786e431b9740
3
+ size 8879580968