Upload OPTForCausalLM
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +32 -0
- pytorch_model-00001-of-00053.bin +3 -0
- pytorch_model-00002-of-00053.bin +3 -0
- pytorch_model-00003-of-00053.bin +3 -0
- pytorch_model-00004-of-00053.bin +3 -0
- pytorch_model-00005-of-00053.bin +3 -0
- pytorch_model-00006-of-00053.bin +3 -0
- pytorch_model-00007-of-00053.bin +3 -0
- pytorch_model-00008-of-00053.bin +3 -0
- pytorch_model-00009-of-00053.bin +3 -0
- pytorch_model-00010-of-00053.bin +3 -0
- pytorch_model-00011-of-00053.bin +3 -0
- pytorch_model-00012-of-00053.bin +3 -0
- pytorch_model-00013-of-00053.bin +3 -0
- pytorch_model-00014-of-00053.bin +3 -0
- pytorch_model-00015-of-00053.bin +3 -0
- pytorch_model-00016-of-00053.bin +3 -0
- pytorch_model-00017-of-00053.bin +3 -0
- pytorch_model-00018-of-00053.bin +3 -0
- pytorch_model-00019-of-00053.bin +3 -0
- pytorch_model-00020-of-00053.bin +3 -0
- pytorch_model-00021-of-00053.bin +3 -0
- pytorch_model-00022-of-00053.bin +3 -0
- pytorch_model-00023-of-00053.bin +3 -0
- pytorch_model-00024-of-00053.bin +3 -0
- pytorch_model-00025-of-00053.bin +3 -0
- pytorch_model-00026-of-00053.bin +3 -0
- pytorch_model-00027-of-00053.bin +3 -0
- pytorch_model-00028-of-00053.bin +3 -0
- pytorch_model-00029-of-00053.bin +3 -0
- pytorch_model-00030-of-00053.bin +3 -0
- pytorch_model-00031-of-00053.bin +3 -0
- pytorch_model-00032-of-00053.bin +3 -0
- pytorch_model-00033-of-00053.bin +3 -0
- pytorch_model-00034-of-00053.bin +3 -0
- pytorch_model-00035-of-00053.bin +3 -0
- pytorch_model-00036-of-00053.bin +3 -0
- pytorch_model-00037-of-00053.bin +3 -0
- pytorch_model-00038-of-00053.bin +3 -0
- pytorch_model-00039-of-00053.bin +3 -0
- pytorch_model-00040-of-00053.bin +3 -0
- pytorch_model-00041-of-00053.bin +3 -0
- pytorch_model-00042-of-00053.bin +3 -0
- pytorch_model-00043-of-00053.bin +3 -0
- pytorch_model-00044-of-00053.bin +3 -0
- pytorch_model-00045-of-00053.bin +3 -0
- pytorch_model-00046-of-00053.bin +3 -0
- pytorch_model-00047-of-00053.bin +3 -0
- pytorch_model-00048-of-00053.bin +3 -0
- pytorch_model-00049-of-00053.bin +3 -0
config.json
ADDED
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "huge",
|
3 |
+
"_remove_final_layer_norm": false,
|
4 |
+
"activation_dropout": 0.0,
|
5 |
+
"activation_function": "gelu",
|
6 |
+
"architectures": [
|
7 |
+
"OPTForCausalLM"
|
8 |
+
],
|
9 |
+
"attention_dropout": 0.1,
|
10 |
+
"bias": false,
|
11 |
+
"bos_token_id": 0,
|
12 |
+
"do_layer_norm_before": true,
|
13 |
+
"dropout": 0.1,
|
14 |
+
"eos_token_id": 2,
|
15 |
+
"ffn_dim": 40960,
|
16 |
+
"hidden_size": 10240,
|
17 |
+
"init_std": 0.02,
|
18 |
+
"layer_norm_elementwise_affine": false,
|
19 |
+
"layerdrop": 0.0,
|
20 |
+
"learned_embeddings": true,
|
21 |
+
"max_position_embeddings": 2048,
|
22 |
+
"model_type": "opt",
|
23 |
+
"num_attention_heads": 80,
|
24 |
+
"num_hidden_layers": 96,
|
25 |
+
"pad_token_id": 1,
|
26 |
+
"scale_embeddings": false,
|
27 |
+
"torch_dtype": "float32",
|
28 |
+
"transformers_version": "4.24.0",
|
29 |
+
"use_cache": true,
|
30 |
+
"vocab_size": 50000,
|
31 |
+
"word_embed_proj_dim": 10240
|
32 |
+
}
|
pytorch_model-00001-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d59b3a886e5aa10edbb30abf036990ef58825e045bb04e8b58209b6b7d3bbf55
|
3 |
+
size 8843724059
|
pytorch_model-00002-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c1e4d079d4798fe416ef239cd783429dcf025cdafd2433264a59336e8564b3b
|
3 |
+
size 9647850097
|
pytorch_model-00003-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27411f3684c214b3bed915bb50ff6db5e5e664d7fab89153d3565cee12a98d06
|
3 |
+
size 9647932551
|
pytorch_model-00004-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fdc5096fe4d093955fe9d63b31d7ad7de4677bb65d73219a96f4c279fad339d
|
3 |
+
size 9647932527
|
pytorch_model-00005-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be2014f932d96d19987fcfaa5c480ad754373e8c8dd0ca0e0232eb53e0433295
|
3 |
+
size 9647932527
|
pytorch_model-00006-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e92b24a150be4f09c4863553f55d42752cc3d0ce7d481851754b6462a3922e9
|
3 |
+
size 8389558961
|
pytorch_model-00007-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8cc2c149b20f1aaa2741fa7d55da6fc0d81e936e24d27eea9a46885d474768b0
|
3 |
+
size 8389518683
|
pytorch_model-00008-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2985b25da8b2d5864e86da483910a445bbb4a7c426888c3f09e4cbbd076d75a2
|
3 |
+
size 9647850161
|
pytorch_model-00009-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22a7eddf45ec1c4c287c9628857fd1eed0b78adbd305ee2c1491e78dbe99e297
|
3 |
+
size 9647932551
|
pytorch_model-00010-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b17642319c68abfa6842133c420126090e4cc4475eac0bca3cd61cd0009519b
|
3 |
+
size 9647932527
|
pytorch_model-00011-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8b2af6cb662d28403e110c39fe625319f176f870758a0d60454a7c77455d45e
|
3 |
+
size 9647932527
|
pytorch_model-00012-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3f1e6c1dacfa33e94cb3434243913a2139c16b8462a1fa4be79e3c326de3858
|
3 |
+
size 8389558961
|
pytorch_model-00013-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b427688b8876bfb01199d321bac1d214a839f6f229e84e9ac930e215616a8ec7
|
3 |
+
size 8389518683
|
pytorch_model-00014-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:439d9faaec3ebde80e9e16d6b57e7aeee702b79b65f0dd0bf3b7476ff4bd01c7
|
3 |
+
size 9647850161
|
pytorch_model-00015-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0088e7c2f90924a001120d96abc152da76593f04d8ad2cb8402cd265611d7249
|
3 |
+
size 9647932551
|
pytorch_model-00016-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:332baebd649bfdf03da54d98486b3ecaa61a2aec679eccb42ca4f276a66c2468
|
3 |
+
size 9647932527
|
pytorch_model-00017-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86d71304be21ce2878edec937bfe93b12808c16befcb68eba647d3291ba92446
|
3 |
+
size 9647932527
|
pytorch_model-00018-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cac68442c8ac028e33c4d32253f9dbecf73cbe92ad1c51c006d08a277ba2fa3c
|
3 |
+
size 8389558961
|
pytorch_model-00019-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4947319c1c2a826ae2dd4092d47ad29ac76f2d532b1f79721c785b27ce7e51e
|
3 |
+
size 8389518683
|
pytorch_model-00020-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e31d1a7b8489c34a73367ca7ca8ecd3857c8c9c411d7fdfbe2f54e6b6e449d1f
|
3 |
+
size 9647850161
|
pytorch_model-00021-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc1e03919c55300cfafcba4faf2ba71b94347f20c739b93845c5159eda973c3b
|
3 |
+
size 9647932551
|
pytorch_model-00022-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6e8394911844569d6921e897e9aeb40576a97e74fcc19a09f982b6eb0cfdd93
|
3 |
+
size 9647932527
|
pytorch_model-00023-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc605b13a972a6697ddd942b09b8d140fa38a4604ce4d5329227e22d1dddbec5
|
3 |
+
size 9647932527
|
pytorch_model-00024-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acb0c1ff775ecc798d18863419ca4aa06821f14847f1e596b149390f17c45868
|
3 |
+
size 8389558961
|
pytorch_model-00025-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1c22ff38dd4bd849bd77205fa40c942cce251b6fa48eeec7dd562a22cd34095
|
3 |
+
size 8389518683
|
pytorch_model-00026-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:188d6daa7773d5a55c3b26b99513d1820f4125f308c82e187801afc429459a64
|
3 |
+
size 9647850161
|
pytorch_model-00027-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de38d2ef277337a1aad49674577c2f3309b2acb9de6f4a1c0436ac1846db1729
|
3 |
+
size 9647932551
|
pytorch_model-00028-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed57a657194b6f763c8b07eb319d7a01764198a138feddd5ed0e93703191bdd0
|
3 |
+
size 9647932527
|
pytorch_model-00029-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1192a4ad8f99abd991854a6bdac96b59426df325be6e597c4abd9262efa39e5
|
3 |
+
size 9647932527
|
pytorch_model-00030-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa8e96f0fb352fe4ce57e78041d6eefc26b5c05b393326393e479a136b2192e0
|
3 |
+
size 8389558961
|
pytorch_model-00031-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd3da23a723f093eae8d277bfdfa62cdc05a8fd8cfbaf402182105f239e3933f
|
3 |
+
size 8389518683
|
pytorch_model-00032-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c32df5861d52b9aa5614c59641c90103b79aec6e5c951f6c20637ba441fd8dd
|
3 |
+
size 9647850161
|
pytorch_model-00033-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f696d41065eb596da0d45224fefa65ee8d654442a46725248f1a6f098efd39f3
|
3 |
+
size 9647932551
|
pytorch_model-00034-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17ac49ae47d578c79dc30f4a9f6634e7deae50258cb40f8df10c91432a1be384
|
3 |
+
size 9647932527
|
pytorch_model-00035-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57668df277444ea9512a3a459395918fc8f665ccfd876c5ebec444d5ce73049d
|
3 |
+
size 9647932527
|
pytorch_model-00036-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e73d8d258aba60ebe1a21bf761ed4323bd12190748a89d1586f2efd35bb05171
|
3 |
+
size 8389558961
|
pytorch_model-00037-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:138ccd7e66807c942a6c3b19ed0afca424350d149bd4c21f34f066756c33cb42
|
3 |
+
size 8389518683
|
pytorch_model-00038-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8901f5e0d834ed11effa0544692757cbdce8a8448d8d8d07ca9165af223e8f9
|
3 |
+
size 9647850161
|
pytorch_model-00039-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ad17ed87f80c6ef2dc37b42b3eb315c97a7a95c8c97f9e2624e7ffb7dc4fc94
|
3 |
+
size 9647932551
|
pytorch_model-00040-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82d337e9c0e55050c7f20800077ecb4e33664a66c2f5c1d393b3f624aa84349e
|
3 |
+
size 9647932527
|
pytorch_model-00041-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b91b32f5472d0fe3750884151db6c29e92922b11d1c8dffe82181ddabd111a1b
|
3 |
+
size 9647932527
|
pytorch_model-00042-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1b89d52d795648a42e8d4b205079d37698c1ade319f032d3773f858163f429a
|
3 |
+
size 8389558961
|
pytorch_model-00043-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a6126fde8e1ff72db4ac230ccddc74d76ff1923b188b6843ef2e166dd86b3a6
|
3 |
+
size 8389518683
|
pytorch_model-00044-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec6fe592118641a4655e276dd97898365365690a3d70c0484b6f3579055069a1
|
3 |
+
size 9647850161
|
pytorch_model-00045-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1187a24d64f28964976bd2ba5707ab017a6de42539d133ff393164286c1ae872
|
3 |
+
size 9647932551
|
pytorch_model-00046-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42dda95f62e3a8ca9d9b273c6115239e209dc6dcc1e3c6f1d8ca813b3c55c962
|
3 |
+
size 9647932527
|
pytorch_model-00047-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8709f68d2f0f5e86ab9b4c1125da6c9645cdc99d1790cf9829bee100f9bbaf15
|
3 |
+
size 9647932527
|
pytorch_model-00048-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b08cb4b5da8cf2ac29418b8818ffc447921a2ed012c03e6e2e2296c91fadeb97
|
3 |
+
size 8389558961
|
pytorch_model-00049-of-00053.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d05d80333d36eb4971ef0e8ed39fcc78389a628d4434c9e200560113e4c5df2a
|
3 |
+
size 8389518683
|