CharlieFRuan
committed on
Commit
•
26ccf83
1
Parent(s):
9fdecf4
Initial commit
Browse files. This view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +41 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "gpt_neox",
|
3 |
+
"quantization": "q4f16_1",
|
4 |
+
"model_config": {
|
5 |
+
"use_parallel_residual": false,
|
6 |
+
"hidden_size": 2560,
|
7 |
+
"intermediate_size": 10240,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"layer_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 50432,
|
12 |
+
"rotary_pct": 1.0,
|
13 |
+
"position_embedding_base": 10000,
|
14 |
+
"context_window_size": 2048,
|
15 |
+
"head_dim": 80,
|
16 |
+
"prefill_chunk_size": 2048,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"ffn_out_dtype": "float32"
|
19 |
+
},
|
20 |
+
"vocab_size": 50432,
|
21 |
+
"context_window_size": 2048,
|
22 |
+
"sliding_window_size": -1,
|
23 |
+
"prefill_chunk_size": 2048,
|
24 |
+
"attention_sink_size": -1,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"mean_gen_len": 128,
|
27 |
+
"max_gen_len": 512,
|
28 |
+
"shift_fill_factor": 0.3,
|
29 |
+
"temperature": 0.7,
|
30 |
+
"repetition_penalty": 1.0,
|
31 |
+
"top_p": 0.95,
|
32 |
+
"conv_template": "redpajama_chat",
|
33 |
+
"pad_token_id": 0,
|
34 |
+
"bos_token_id": 0,
|
35 |
+
"eos_token_id": 0,
|
36 |
+
"tokenizer_files": [
|
37 |
+
"tokenizer.json",
|
38 |
+
"tokenizer_config.json"
|
39 |
+
],
|
40 |
+
"version": "0.1.0"
|
41 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ae66740237759d9fec47fb18747a78d57a6c8fe35375baa6119e1eba1c87e54
|
3 |
+
size 64552960
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f57f4c78b152094aec10b42ecfc0896b3ead2c1529cd8857a707214dcb4a7a9f
|
3 |
+
size 22855680
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1433037461c47209078a982cdf2c0effcc71f20fd54140fc7c7f8639ff6118e9
|
3 |
+
size 29542400
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16ef8f2c41ee486b9eb763bcf1d6cf4d87ea80e763cfe54f6a60e1cffacaf5ba
|
3 |
+
size 29562880
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b07dc7ceb664ffdea2edc1201733df23e4a2a6eb19c13be749c2ea3a4d29d057
|
3 |
+
size 29552640
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c18539ea299d464516bcdc528366933a72479bf9f089fce318762822e83ea59
|
3 |
+
size 29542400
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b67dd64324a28a6c6ed559e6054e5b114041207bc553a41131eb43f7a6614622
|
3 |
+
size 29562880
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7992c420b3f2cc007e6f8fba6e27bf0bee9879683181608e6d16dcbc266b5835
|
3 |
+
size 29552640
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1683840863240bcce116d99a2032735c2082ee93d19e412a4af8d8c28a0e16a
|
3 |
+
size 29542400
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6eee959766d3e47185acf372b4037b9e15965eaa2c00f519dc7985e80a844434
|
3 |
+
size 29562880
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2d55d946c2d9845973ae3d0a33257cb8d5f2ec18badb877c9efc05fb75f11c0
|
3 |
+
size 29552640
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:912ae54afd6cd354640f6869c34e220fac44aae844a5fe7a0c45c4a8969f9490
|
3 |
+
size 29542400
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29c2c58175b9ad6d227fbac239eb7d130fdf0026569c2b31234043cf3d7c6679
|
3 |
+
size 29562880
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0932988579e862f685a1ee996ec3335cb87ab144ba190f5bd6dcc1ff9b137350
|
3 |
+
size 29562880
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c406baaca339ff16b2a697246bfaaf6b0922ccd2e0e1c0238835df083cbcd69
|
3 |
+
size 29552640
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85cfa8c063c02fba02d0f9365f6ba2373c37e91d09d8bd1e5c242c49d7f3b70c
|
3 |
+
size 29542400
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:015e32e0aa06707118e6b9321db9e6fc88453817c240b241d28e454d8fc85ba5
|
3 |
+
size 29562880
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:551e1949015d7e642b903af3986c4903009995b5ad1ed52ae3d14ff75027b5e8
|
3 |
+
size 29552640
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f2cbb900d2bbc7874e9fd456bba84cc873b46135af3fbb112a310f8eec34e52
|
3 |
+
size 29542400
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1fb9063abd3512d769233de4c448e19c57f10f6746b0906328612d32753f7b8
|
3 |
+
size 29562880
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45cacd3877783d085bd0a3b131e16e2ba6ada8a303b736f81bda9e183664c38a
|
3 |
+
size 29552640
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65e767f93f7eb9905ee96f657fe9d4d2517d7c65b433e9ddb8f9253f16304206
|
3 |
+
size 29542400
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:239787a92024c837fe633d0deeaad39bb9a50549b203edea32568a67135783e0
|
3 |
+
size 29562880
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:872a71041b67923f721b36948cc40fe985848d5a91ba5574fa4320c88a47fa4b
|
3 |
+
size 29552640
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cb17f9d6976a421f307fa149ccfd9620a2785a683e42118691521a341110efe
|
3 |
+
size 29552640
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be6eb93e7083e1a8a2cb1993374fc1c89bbe5ea5c3d873c09d07076d375254cb
|
3 |
+
size 29542400
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67d5040211c46e7dcb65d97a487c4ca157ef973dd6bb3e17f4390e653744566b
|
3 |
+
size 29562880
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:541a2020f34e6ab71dc3aac7abf143fb970c51d1b51eb1f19d1847a7c393cbd9
|
3 |
+
size 29552640
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05d016a394f238f16d0fa2b10c63dce13d9889cbb63924c66a199d38a377a666
|
3 |
+
size 29542400
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57e642321b0b2b79ceac74b358d295422b5cfc7c3680feeb499c468190ec88df
|
3 |
+
size 29562880
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3130517f8de95859511e6b358a9c4169bc23d2516af177117404fccad35cdec4
|
3 |
+
size 29552640
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:569b08abb4169181a2c0498f40723960c08f618e6785a4f3d5572ccc34b20762
|
3 |
+
size 29542400
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c99a82b1b232bb3b76506940a8dfa36a57abeb3d3552686b810f68f51a929911
|
3 |
+
size 29562880
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2bb148a89a9b7b5ae317af6081e003b32f808c2a9bec518eb24946c512d2cbb
|
3 |
+
size 29552640
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:736e10e1524170ffdd1af4abe26a83d8a79c284ff33e3cd10a999a82565ccc72
|
3 |
+
size 29542400
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11cbe4fea4513d4d2a629b4f4959ad041156781d99601594d0edd639e03b1750
|
3 |
+
size 29542400
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0609aea4e7f6738993a2d6c7b3124c3bc6543821df416faefe52869be0ae5aae
|
3 |
+
size 29562880
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd458333beb80afd7e0322afcc1a5d89738ca9fc2eff885653fa6709c1dcdb46
|
3 |
+
size 29552640
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5843025273fbfe7e4b554fb9fe43ebf8aa7da819e646969cfe690220fde7e8f7
|
3 |
+
size 29542400
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9eb47acc04d72b9830c33e96a38ed221a92203f67800deac88a3c0c0b5363673
|
3 |
+
size 29562880
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7859ce118567f77904fed2e59c39e178eb9b80e3001c7e53dcd586ae06464203
|
3 |
+
size 29552640
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbb2bbe16c68fcefae08ddd755afa85645d527bbf8282e20e968dd9e841a0f8a
|
3 |
+
size 29542400
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f61d825835d0f607895429c4b57a0ab4182d61d729bd5a45e7bae6348763890
|
3 |
+
size 29562880
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f1e5363a86299c75231a30f28278a919340438d38428cb52c273d248178428f
|
3 |
+
size 29552640
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76de7aedcc93fd34f21d662efb0d4fa78568881c54f23dcccb2e9ab06d25d4df
|
3 |
+
size 64552960
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ee9f2f3d8328fb0f97c5b45560670e95903a2f91fd3570a6df80cd7aabddfcb
|
3 |
+
size 29562880
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba9e1f0730c6afcceee3970499e006d9731b428fa09ece273f011e5442a5846e
|
3 |
+
size 22835200
|