Upload LlamaForCausalLM
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +29 -0
- generation_config.json +8 -0
- model-00001-of-00106.safetensors +3 -0
- model-00002-of-00106.safetensors +3 -0
- model-00003-of-00106.safetensors +3 -0
- model-00004-of-00106.safetensors +3 -0
- model-00005-of-00106.safetensors +3 -0
- model-00006-of-00106.safetensors +3 -0
- model-00007-of-00106.safetensors +3 -0
- model-00008-of-00106.safetensors +3 -0
- model-00009-of-00106.safetensors +3 -0
- model-00010-of-00106.safetensors +3 -0
- model-00011-of-00106.safetensors +3 -0
- model-00012-of-00106.safetensors +3 -0
- model-00013-of-00106.safetensors +3 -0
- model-00014-of-00106.safetensors +3 -0
- model-00015-of-00106.safetensors +3 -0
- model-00016-of-00106.safetensors +3 -0
- model-00017-of-00106.safetensors +3 -0
- model-00018-of-00106.safetensors +3 -0
- model-00019-of-00106.safetensors +3 -0
- model-00020-of-00106.safetensors +3 -0
- model-00021-of-00106.safetensors +3 -0
- model-00022-of-00106.safetensors +3 -0
- model-00023-of-00106.safetensors +3 -0
- model-00024-of-00106.safetensors +3 -0
- model-00025-of-00106.safetensors +3 -0
- model-00026-of-00106.safetensors +3 -0
- model-00027-of-00106.safetensors +3 -0
- model-00028-of-00106.safetensors +3 -0
- model-00029-of-00106.safetensors +3 -0
- model-00030-of-00106.safetensors +3 -0
- model-00031-of-00106.safetensors +3 -0
- model-00032-of-00106.safetensors +3 -0
- model-00033-of-00106.safetensors +3 -0
- model-00034-of-00106.safetensors +3 -0
- model-00035-of-00106.safetensors +3 -0
- model-00036-of-00106.safetensors +3 -0
- model-00037-of-00106.safetensors +3 -0
- model-00038-of-00106.safetensors +3 -0
- model-00039-of-00106.safetensors +3 -0
- model-00040-of-00106.safetensors +3 -0
- model-00041-of-00106.safetensors +3 -0
- model-00042-of-00106.safetensors +3 -0
- model-00043-of-00106.safetensors +3 -0
- model-00044-of-00106.safetensors +3 -0
- model-00045-of-00106.safetensors +3 -0
- model-00046-of-00106.safetensors +3 -0
- model-00047-of-00106.safetensors +3 -0
- model-00048-of-00106.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "./megacarcoroni",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 28672,
|
14 |
+
"max_position_embeddings": 4096,
|
15 |
+
"model_type": "llama",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_hidden_layers": 140,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"pad_token_id": 0,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"rms_norm_eps": 1e-05,
|
22 |
+
"rope_scaling": null,
|
23 |
+
"rope_theta": 10000.0,
|
24 |
+
"tie_word_embeddings": false,
|
25 |
+
"torch_dtype": "float32",
|
26 |
+
"transformers_version": "4.37.2",
|
27 |
+
"use_cache": false,
|
28 |
+
"vocab_size": 32000
|
29 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"pad_token_id": 0,
|
6 |
+
"transformers_version": "4.37.2",
|
7 |
+
"use_cache": false
|
8 |
+
}
|
model-00001-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b21385d70b303324eff225a6b6a8705975b805cb23ebe1fd18e75405d2846de4
|
3 |
+
size 4806739440
|
model-00002-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d2c8dcf3a734d0d7e73dae05b975197664be5229202875018d1f8ab23474aa8
|
3 |
+
size 4630578440
|
model-00003-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f000c6dd16e76bcf456cdc84853be3c6d01fa131c6d7a7399183296be28ec90f
|
3 |
+
size 4362142864
|
model-00004-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67386c6a282a1defe3f3c9636f6b165b14e81abc96665db9e4de6d68a04eab5c
|
3 |
+
size 4966188864
|
model-00005-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a96516b9e430fa970a82fa415bedae34bd2c61f45d9c20218bb8064066d44add
|
3 |
+
size 4362142864
|
model-00006-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1716a29f0aa0e9e8cce505d0f1fd06aff03e090d04ebe402d37531cd49a8f13
|
3 |
+
size 4362142864
|
model-00007-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9f305229739d3eef00d6df105adfd795cd6381307e887e20c1087fbcbbedc72
|
3 |
+
size 4966188864
|
model-00008-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02ff2b92df7629fa797a2afc729d2bdedf1fd627c2a1eeadb6dc2475c8a5a4f0
|
3 |
+
size 4362142880
|
model-00009-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5d017e765d91e0e8d927504e7d75cb746a47f5fabe8c2e51d7f48af110a9220
|
3 |
+
size 4362142872
|
model-00010-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d24b98baef4e5bb8b97646113b3595e3736b09bdae48200635fb0466c93e19ae
|
3 |
+
size 4966188880
|
model-00011-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a417e07496ddc82043773c786e11e1e5d5955d542b59f9ad66d0ee7a66e3c1e0
|
3 |
+
size 4362142872
|
model-00012-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5ffac5372b71c252999d3f419ee635a6b7f962d8819dfe53e66ec4c398041f8
|
3 |
+
size 4362142872
|
model-00013-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:587adef026b7eec7f0553dfbd34fff62737f6e220e729b16325262b595149530
|
3 |
+
size 4966188880
|
model-00014-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ef65978f45eb6f4bf9e9d30cc0909c327110980b183efd4594411b09bd7f210
|
3 |
+
size 4362142872
|
model-00015-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:531cbe73ae058d9a9941332853a6f35c95fcdce481328e48c333305a180cd143
|
3 |
+
size 4362142872
|
model-00016-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c71c6f14cc4cda9cb27811748a811e4b7d24ce9195a9e9d4e83b247319b56fa
|
3 |
+
size 4966188880
|
model-00017-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a5c74e24d8967dc7ea1cf810b29cb8cd81e7ccbf1ad2785b063df776f84a0cd
|
3 |
+
size 4362142872
|
model-00018-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e769b9d5c25540f063059451621d5dca8ff3ad2ff6be1034844f876ea49f89d1
|
3 |
+
size 4362142872
|
model-00019-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2635f058a77897f09ca9b13b11b13dc4ac04c006c3f8f940b67b98f963387f3
|
3 |
+
size 4966188880
|
model-00020-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d822ebbdc83097720e2a7941218c31696c3f27921e198e63fd53b6e7042a16e1
|
3 |
+
size 4362142872
|
model-00021-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51c54f792ee91def281219b3976d3f58009bb282e18537fd3127045ffdfe5499
|
3 |
+
size 4362142872
|
model-00022-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4303fed0f736eca7917344106b2f14ea587ee74663b151feb5c3fec0d1fa246
|
3 |
+
size 4966188880
|
model-00023-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6306da4afe04018ba971f2ac1fed9efa26d86ddd4acadb820a7e4db021dd48bb
|
3 |
+
size 4362142872
|
model-00024-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a97dbd0a8416b96016f774259a422e0ef15f1484ff3ae4a1569aa6f350f6242
|
3 |
+
size 4362142872
|
model-00025-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2fb5e4f97dd0d43e428e9e9bb6cbba50609ac33061d7532c7b3ec853b7efa31e
|
3 |
+
size 4966188880
|
model-00026-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8094b9c97244819865d4624b59415d8ffc3769f38399b8cf9da0c283da49c62a
|
3 |
+
size 4362142872
|
model-00027-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed2bca02e0193a2d52acb710cf40fbce0f410e8fadb0bb4187561a131948e6ed
|
3 |
+
size 4362142872
|
model-00028-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95948f02180a8778c585a79ced8b06894b65df27541f364581566a5b2a3e360b
|
3 |
+
size 4966188880
|
model-00029-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99c3bcf80561fad4f2eae54f728c57b5b35d09d44439a82adb53c650f9bdc9b1
|
3 |
+
size 4362142872
|
model-00030-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f81828f963b9482f607b1ffa8f2d39acabd29a24b460f7a842e1f0d0672a8db
|
3 |
+
size 4362142872
|
model-00031-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:030e175150d0cb29de1cc1c9e24a91e58f35b76f3883b7195f22c504e5098b55
|
3 |
+
size 4966188880
|
model-00032-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:722b12e8fd3378b8925a00c0f1e0b5b6cdc18820dfda24e4dd55a0a32c2bea70
|
3 |
+
size 4362142872
|
model-00033-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75a2ef7a447d5e03996ca2d014d535297fd40aeabaecb31ffacfe677c9f10d7c
|
3 |
+
size 4362142872
|
model-00034-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34eb22eb6a2e98e8a7faaf2a65cf3a536beb5eeaaf53a8f55d71ba980c43abb6
|
3 |
+
size 4966188880
|
model-00035-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb818d41c370749dbb292b56ef05e5e546b46a17ac183fe7e1b71a42aee46fdd
|
3 |
+
size 4362142872
|
model-00036-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f21134cc180b8dfb351f0e9efb05e425d60bfcd1e0225ffe3f5ea2287c3e336
|
3 |
+
size 4362142872
|
model-00037-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8dd7c663b2f4418e4f19661796186026035eb514cc05361668abab99ba8c6b9
|
3 |
+
size 4966188880
|
model-00038-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7624ee696b22aa2ef62cc74b3a24a35a5a5cf4941cd10ae925fb83493750bd6
|
3 |
+
size 4362142872
|
model-00039-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8996cf449c3096af63066a0dae3cd5b2636e74afcfd07c510259de7ffc35184
|
3 |
+
size 4362142872
|
model-00040-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4176c897ae65fb2d632b00048e7fe30e2d60e5e1284360f67af449d0d15d7269
|
3 |
+
size 4966188880
|
model-00041-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b52e28388227b546e024693c9622dc29f10fbf344002f3f1c7602d6cbe79a66
|
3 |
+
size 4362142872
|
model-00042-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb1087ec8075176256dd34381fbcd66aae8bdf13eb1b825a9c24c864ac5a8793
|
3 |
+
size 4362142872
|
model-00043-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11c94da85047d84a480ecf5888646189a1c0322c05c3e028be12111603eb1344
|
3 |
+
size 4966188880
|
model-00044-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6d579b80f3459bab63df71cb5a8c8f0349164f44e582e57d0a8f738870025a6
|
3 |
+
size 4362142872
|
model-00045-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bda6b524e00581f7a24ccf7a2a94260a6107ba82dba4273a161e663f47370cf
|
3 |
+
size 4362142872
|
model-00046-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6dab034260ae166d7c17e4dcdf1d535ba50efbfd4fc55706342ce6995c06ffc7
|
3 |
+
size 4966188880
|
model-00047-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c655c806521fc6bbf5992ebcc0c7d31894af558ab29eae0dc08e40087cbd4e2
|
3 |
+
size 4362142872
|
model-00048-of-00106.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:366b0303c30c1059ad42c585e7ba5b3e1e37ddf6e0ca2635a77f6b8a73ad3b6b
|
3 |
+
size 4362142872
|