jiminHuang
committed on
Commit
•
d27dcfa
1
Parent(s):
e9d78da
Upload LlamaForCausalLM
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +28 -0
- generation_config.json +10 -0
- model-00001-of-00061.safetensors +3 -0
- model-00002-of-00061.safetensors +3 -0
- model-00003-of-00061.safetensors +3 -0
- model-00004-of-00061.safetensors +3 -0
- model-00005-of-00061.safetensors +3 -0
- model-00006-of-00061.safetensors +3 -0
- model-00007-of-00061.safetensors +3 -0
- model-00008-of-00061.safetensors +3 -0
- model-00009-of-00061.safetensors +3 -0
- model-00010-of-00061.safetensors +3 -0
- model-00011-of-00061.safetensors +3 -0
- model-00012-of-00061.safetensors +3 -0
- model-00013-of-00061.safetensors +3 -0
- model-00014-of-00061.safetensors +3 -0
- model-00015-of-00061.safetensors +3 -0
- model-00016-of-00061.safetensors +3 -0
- model-00017-of-00061.safetensors +3 -0
- model-00018-of-00061.safetensors +3 -0
- model-00019-of-00061.safetensors +3 -0
- model-00020-of-00061.safetensors +3 -0
- model-00021-of-00061.safetensors +3 -0
- model-00022-of-00061.safetensors +3 -0
- model-00023-of-00061.safetensors +3 -0
- model-00024-of-00061.safetensors +3 -0
- model-00025-of-00061.safetensors +3 -0
- model-00026-of-00061.safetensors +3 -0
- model-00027-of-00061.safetensors +3 -0
- model-00028-of-00061.safetensors +3 -0
- model-00029-of-00061.safetensors +3 -0
- model-00030-of-00061.safetensors +3 -0
- model-00031-of-00061.safetensors +3 -0
- model-00032-of-00061.safetensors +3 -0
- model-00033-of-00061.safetensors +3 -0
- model-00034-of-00061.safetensors +3 -0
- model-00035-of-00061.safetensors +3 -0
- model-00036-of-00061.safetensors +3 -0
- model-00037-of-00061.safetensors +3 -0
- model-00038-of-00061.safetensors +3 -0
- model-00039-of-00061.safetensors +3 -0
- model-00040-of-00061.safetensors +3 -0
- model-00041-of-00061.safetensors +3 -0
- model-00042-of-00061.safetensors +3 -0
- model-00043-of-00061.safetensors +3 -0
- model-00044-of-00061.safetensors +3 -0
- model-00045-of-00061.safetensors +3 -0
- model-00046-of-00061.safetensors +3 -0
- model-00047-of-00061.safetensors +3 -0
- model-00048-of-00061.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/workspace/LLMindCraft/saved_models/finetuned_mix_pmcllama_new",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 28672,
|
14 |
+
"max_position_embeddings": 4096,
|
15 |
+
"model_type": "llama",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_hidden_layers": 80,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"pretraining_tp": 1,
|
20 |
+
"rms_norm_eps": 1e-05,
|
21 |
+
"rope_scaling": null,
|
22 |
+
"rope_theta": 10000.0,
|
23 |
+
"tie_word_embeddings": false,
|
24 |
+
"torch_dtype": "float32",
|
25 |
+
"transformers_version": "4.36.2",
|
26 |
+
"use_cache": true,
|
27 |
+
"vocab_size": 32000
|
28 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 1,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"max_length": 4096,
|
6 |
+
"pad_token_id": 0,
|
7 |
+
"temperature": 0.6,
|
8 |
+
"top_p": 0.9,
|
9 |
+
"transformers_version": "4.36.2"
|
10 |
+
}
|
model-00001-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2db0acafecfccc738d19ece258f4e1b7597b2a289a365d209bd2e395d23b69fd
|
3 |
+
size 4806739440
|
model-00002-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3c46467b2b79eaad5457320abff953df94699a5263de9206075502d7283b50e
|
3 |
+
size 4630578440
|
model-00003-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a436ce211f289059f7d50f47bf245644cb2ab29440f1bd636b75ee28c4104694
|
3 |
+
size 4362142864
|
model-00004-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d862eac8b45abcb047ac33ee983da23f937a000b17d7123364e04b8179e27b02
|
3 |
+
size 4966188864
|
model-00005-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa543be49fe943cedd7eb5c8a3f728787efe54a17022d17f65d872e904e3040c
|
3 |
+
size 4362142864
|
model-00006-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63b5d9f4406e9dc739a911af8c0be6ae490dff7bb4db5dbfd599b31a36b14b68
|
3 |
+
size 4362142864
|
model-00007-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcd828cf4e1671229559c47bb6746a7eb5464b15d11711871a273abba988f6f1
|
3 |
+
size 4966188864
|
model-00008-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15a99146474f29974b9216f578c083fb90dc4ada466895a40b098ccd2acc9baf
|
3 |
+
size 4362142880
|
model-00009-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39840568baf42b74638dafcc244afc35b44c33a01c3ca2c0c8274386193929f0
|
3 |
+
size 4362142872
|
model-00010-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d779c06b6affccd637d3910eeb3d9f64ac5065fdd8903bc203f0e577db9763cc
|
3 |
+
size 4966188880
|
model-00011-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea5b6bfd0c1a76438ef89298d831224d096f4aa8ec943f8439265b094abcdf15
|
3 |
+
size 4362142872
|
model-00012-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a43f3e455daa5355c2fff44ec8ca69ba831e2105a1a8b049f29b3c6fa026e48
|
3 |
+
size 4362142872
|
model-00013-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7186e6265cf2ff33c468049eb90d57d7f550e40243b48dff41e9c913d202d97
|
3 |
+
size 4966188880
|
model-00014-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ea495c0c92d7f6041cd3cdca6fb15d7588611db1a0b606953fb3e804f462386
|
3 |
+
size 4362142872
|
model-00015-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05b8d12b94604b39e8e9f75c61e69828bd8432938fab8fac6accfd4eb5064104
|
3 |
+
size 4362142872
|
model-00016-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97e368921f2f98026d7eef8d23ea9973f330575adb00bd387140956b9f97ba84
|
3 |
+
size 4966188880
|
model-00017-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c34365354a97c5c2cf0dd7fba1e56081108ca20463535bf042115bb3a1aef28
|
3 |
+
size 4362142872
|
model-00018-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:255b41954e2f55c6faf5b11ff05a4a617eb8386dc8fdb32717b108076e7ecbce
|
3 |
+
size 4362142872
|
model-00019-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5340da8d511aeea90db9797fc945b584e3c599c7aa2f505687a5ef0d08577d7a
|
3 |
+
size 4966188880
|
model-00020-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca198ff14cf0e8d716355300ff137cf21da2791daf8e8fb42f9bb26dece8bdcd
|
3 |
+
size 4362142872
|
model-00021-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8de8b132cf4c86c0d6cd1c2978ce0eb3c2ec2a5aa8109d9f0d74465f480c4f0
|
3 |
+
size 4362142872
|
model-00022-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5ade6c9413641b67bbd1e8b038b5fafdafe0af84881aa22110805b576636f95
|
3 |
+
size 4966188880
|
model-00023-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6291113f159e23039b38eaf943cba73a5748c30326757af182e86556076fcf22
|
3 |
+
size 4362142872
|
model-00024-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfe54840e4c6c157cdb8854df7e09ec0edb32d85c3051c5b3e0a54b3f8e774bf
|
3 |
+
size 4362142872
|
model-00025-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6765f6b20185267330d9c140c57304228ba6cfcf812a72e9fec901645b9fbe4b
|
3 |
+
size 4966188880
|
model-00026-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:503e3906d5fe457296c5e3a81c23ad3231f43dea214c5412c5b1fa780a1ea66a
|
3 |
+
size 4362142872
|
model-00027-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3fa2f47175f0ca182040a983d91a02404671071f672f861325684ba8adc4029
|
3 |
+
size 4362142872
|
model-00028-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0004d0d6b18bbc953dff955d8e91b2ad27b59a439246b95faebfa972b7e7815
|
3 |
+
size 4966188880
|
model-00029-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c1ff875c29b44278e3497778e0cecb24573625510b27210416bf16fdd26a453
|
3 |
+
size 4362142872
|
model-00030-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7999f5a9a4b0d1b3fa765829b792cda0079f8c71f33c89a6983eefe29390847d
|
3 |
+
size 4362142872
|
model-00031-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:722b7110657b9fe9df3d761e7e553210b4f3fff56ecc4f2c358c4cfbc9b5f2c2
|
3 |
+
size 4966188880
|
model-00032-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6df97412e052f762594d8e50df66a0ecefa488f16b6d7dc8f32dc25d66ff66a
|
3 |
+
size 4362142872
|
model-00033-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f8e527ba88a9906ac8c592b057a150f899579879f113d558cec3737211e0896
|
3 |
+
size 4362142872
|
model-00034-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9f82cad9089e4d77cc6ef767481d191cc9c1d787515dc4273dbf868fa11d967
|
3 |
+
size 4966188880
|
model-00035-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7faa0a8d4d730c194ca08ddec22ac77f0e15aaae9429ebd962c773508147eae3
|
3 |
+
size 4362142872
|
model-00036-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03237b3d041c0d61e2bb83188cdb52c0dd2222be8177f7e570216950474753b3
|
3 |
+
size 4362142872
|
model-00037-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:765e1ce8a1bb8192f2891cbf73d72e9937b5e30c4ea5a484f08ecb860391117e
|
3 |
+
size 4966188880
|
model-00038-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abe67dca809e62e5e80f3214f1a70f759e77b9422f8e37ec4fd116570ac35e54
|
3 |
+
size 4362142872
|
model-00039-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3ca7f1663399b3fcc3b0629e1081796caa9d9e5cb982eb900ce69aa6c34d46c
|
3 |
+
size 4362142872
|
model-00040-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8464dbaab141ddfbc93f959ae38149abcc71b1b39994e2d40d00e97f7b29a174
|
3 |
+
size 4966188880
|
model-00041-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:861cb380242c96df82b9d8a14ff68dbabb6d9f8ec5f329739d926e2c2dabf6a7
|
3 |
+
size 4362142872
|
model-00042-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1bcb36406d83728b1f52fed8f2ecf8cff23557885f89d0a7859b954e29b99f6
|
3 |
+
size 4362142872
|
model-00043-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2903dbad280b1f49c9bb6a0c379802f5f3c93c8aaea435a5120b159a486e8bdf
|
3 |
+
size 4966188880
|
model-00044-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1dd27c3ac937d089b5cc7cd6510d02a73faa32e0de75dad57ef7805c02610fef
|
3 |
+
size 4362142872
|
model-00045-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:970f99654f4072bcc4b1713854630c8d606d30b68008014abbc1ced37b4ceb57
|
3 |
+
size 4362142872
|
model-00046-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bc371bc0051a03f1141f9e7ec36cea08412fc14accc92749959bb36f802ad93
|
3 |
+
size 4966188880
|
model-00047-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c2004bc2db8cecaed4d629398828723f4046e9bb3ffb4396aec063066184ce6
|
3 |
+
size 4362142872
|
model-00048-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2800392d29e8254d1f0ace6b908a5fd79e94d448f23077801adfc3f9c0e2712
|
3 |
+
size 4362142872
|