marcusguhao
committed on
Commit
•
70abd06
1
Parent(s):
a4cc2b7
Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +83 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
- params_shard_6.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,83 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q3f16_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 3072,
|
7 |
+
"intermediate_size": 8192,
|
8 |
+
"num_attention_heads": 24,
|
9 |
+
"num_hidden_layers": 28,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 128256,
|
12 |
+
"tie_word_embeddings": true,
|
13 |
+
"position_embedding_base": 500000.0,
|
14 |
+
"rope_scaling": {
|
15 |
+
"factor": 32.0,
|
16 |
+
"high_freq_factor": 4.0,
|
17 |
+
"low_freq_factor": 1.0,
|
18 |
+
"original_max_position_embeddings": 8192,
|
19 |
+
"rope_type": "llama3"
|
20 |
+
},
|
21 |
+
"context_window_size": 131072,
|
22 |
+
"prefill_chunk_size": 8192,
|
23 |
+
"num_key_value_heads": 8,
|
24 |
+
"head_dim": 128,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"pipeline_parallel_stages": 1,
|
27 |
+
"max_batch_size": 128
|
28 |
+
},
|
29 |
+
"vocab_size": 128256,
|
30 |
+
"context_window_size": 131072,
|
31 |
+
"sliding_window_size": -1,
|
32 |
+
"prefill_chunk_size": 8192,
|
33 |
+
"attention_sink_size": -1,
|
34 |
+
"tensor_parallel_shards": 1,
|
35 |
+
"pipeline_parallel_stages": 1,
|
36 |
+
"temperature": 0.6,
|
37 |
+
"presence_penalty": 0.0,
|
38 |
+
"frequency_penalty": 0.0,
|
39 |
+
"repetition_penalty": 1.0,
|
40 |
+
"top_p": 0.9,
|
41 |
+
"tokenizer_files": [
|
42 |
+
"tokenizer.json",
|
43 |
+
"tokenizer_config.json"
|
44 |
+
],
|
45 |
+
"tokenizer_info": {
|
46 |
+
"token_postproc_method": "byte_level",
|
47 |
+
"prepend_space_in_encode": false,
|
48 |
+
"strip_space_in_decode": false
|
49 |
+
},
|
50 |
+
"conv_template": {
|
51 |
+
"name": "chatml",
|
52 |
+
"system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
|
53 |
+
"system_message": "A conversation between a user and an LLM-based AI assistant. The assistant gives helpful and honest answers.",
|
54 |
+
"system_prefix_token_ids": null,
|
55 |
+
"add_role_after_system_message": true,
|
56 |
+
"roles": {
|
57 |
+
"user": "<|im_start|>user",
|
58 |
+
"assistant": "<|im_start|>assistant"
|
59 |
+
},
|
60 |
+
"role_templates": {
|
61 |
+
"user": "{user_message}",
|
62 |
+
"assistant": "{assistant_message}",
|
63 |
+
"tool": "{tool_message}"
|
64 |
+
},
|
65 |
+
"messages": [],
|
66 |
+
"seps": [
|
67 |
+
"<|im_end|>\n"
|
68 |
+
],
|
69 |
+
"role_content_sep": "\n",
|
70 |
+
"role_empty_sep": "\n",
|
71 |
+
"stop_str": [
|
72 |
+
"<|im_end|>"
|
73 |
+
],
|
74 |
+
"stop_token_ids": [
|
75 |
+
2
|
76 |
+
],
|
77 |
+
"function_string": "",
|
78 |
+
"use_function_calling": false
|
79 |
+
},
|
80 |
+
"pad_token_id": 0,
|
81 |
+
"bos_token_id": 128000,
|
82 |
+
"eos_token_id": 128001
|
83 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:211bebfb70fb25d0c3220f65eb8a1b44127f247a6c4787a2d5ab9e97e29080df
|
3 |
+
size 158011392
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff5740ad84d9f2d0417bdba64b0000078e488d1397973abe2454af27d061cdcb
|
3 |
+
size 20185088
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da7fafc5a830089b9841f4cc8cedd95405d986a32474129aa1d26082007d623a
|
3 |
+
size 20185088
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abfc5ccf8c3ee5059af712dd2cff3dce404ad648ee1d53019f02b9031b3086d4
|
3 |
+
size 27754496
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bfb0d0a5def0b181f409b2939053924d4418eb81d6035594f2f913d12af14d1
|
3 |
+
size 20185088
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b48a53bcd2d90cdb2627f5c96da1f9f743dcb20d933e00418a2e9a3f217abe2b
|
3 |
+
size 32321536
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c74ff20411f14c82d9f19fd274f753b550b2254f51a9d3a5f0c81ea7bd3b9a9d
|
3 |
+
size 20185088
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27039f8ae8db236fd03d1bea2ec6ebde9d0d4e1b2b4255bce384ae4a0702af93
|
3 |
+
size 29489152
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3c0726c10b988c1286eae1dcc3c772827f1c57d2567c4151a5730759e9fc73b
|
3 |
+
size 31520768
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0750abec88fcdd88ebc2d62f0f9eceb9573ebe930e0c400f232c7d3c1919e5df
|
3 |
+
size 20185088
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e75d5274271e064c5320d437f16c0ca9134039b410e748111ca06325842adc2
|
3 |
+
size 27754496
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46f970d764371402cf739217d58c219e9323ba015ddc6f74496301c7efdbd367
|
3 |
+
size 20185088
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:644c9f17f34766f1a44cbfe4baebdfdc47467723d394e7c72c6509d7eb650439
|
3 |
+
size 31093248
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50152a608a8ca3b02c5a25fea87e24f688f8c6df96e2c2acb89d4c2ee8844507
|
3 |
+
size 32321536
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c9066e6ed88f2d6d2c3bffc3f376c90d05aee0a77c21daad9d82506024e9668
|
3 |
+
size 20185088
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:748a190dce73a4117d3daee8398fafee9ccaaff6ea955fdc3e20f44eb5c75bc7
|
3 |
+
size 29489152
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0830cb04ee2c6186b60d66a3cf973765676bd997755c22594d9ba0170611b38f
|
3 |
+
size 31520768
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8476c9119137be2ba8ad2263c81d7cf03deb36c4d482d2aad6139288a4b6ca82
|
3 |
+
size 20185088
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5918fd4f4bb6add98f8ad4226f62caaf3f5036ac746dd84066e0927f14785d39
|
3 |
+
size 27766784
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7709a160bfa47290af076e905db3712a90ef5c7ae9027d9080433e05fa261d4
|
3 |
+
size 31520768
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2225fb4c8dbc27c83d38834ca3f3230cc3292e9b4e673e2dc371dc505160cbfd
|
3 |
+
size 20185088
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:246b8590c53e720d5337ee56ac66e32e65524b33578e85603b5370fe5754b63f
|
3 |
+
size 27754496
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:707e8d53d9bbf3b103733f686b18c10f1a1920cb9705d23d1bdc7d1ed6790af7
|
3 |
+
size 20185088
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f23bf1612e7810cfe529ba49bb8163d48a65cd274504c5af6ca40781d474eafc
|
3 |
+
size 20185088
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbd419b2e3191e7a795f2bdbea8de9f199b371898c4f11349a23f77f3f959d40
|
3 |
+
size 32321536
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca4dc0a0bc52ab968ab6bb949fd6c3f396bd3dd46b37c68347b59620bc0262a0
|
3 |
+
size 20185088
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:451eb3183e36d62b0176aa42dec8f9c5965bb3dd5e29f1bab814135d81535e13
|
3 |
+
size 29489152
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f716d6748e44548df93c6c3be771268a6d1a5829d3f6100cd2286155632f86b6
|
3 |
+
size 31520768
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40996b0c748d1d704b936f60719a9ff92a989b556509065d293db722c7b935f9
|
3 |
+
size 20185088
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c664a38614f6e608d7520e9898140a73ed7642afe6e3130b9f8cc9ed6012dc0
|
3 |
+
size 27754496
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f16246e19eb20adf3663fa38883e929428d92fced301b3055f0a2adbf11783f
|
3 |
+
size 20185088
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a6ed38f719a3a9cf17404c280421c77d719534d82b66a7ecb0aebe227335590
|
3 |
+
size 32321536
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e88bd410c7227252538370678420ecfc967e084c33bb72c9c9a3bd57605f50f8
|
3 |
+
size 20185088
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac021a53d8456cd7f8c34e0dc0b7164304aaa1b41bb5b907172b5c651efce25c
|
3 |
+
size 29476864
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a832ecd181873e6723f15c2548c66413c937f9dbf8883670c1ef92108025a47
|
3 |
+
size 27754496
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45ef58257a813330ef63b8778b48537e4a205ed8e47ff85a012a614402468b1b
|
3 |
+
size 20185088
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6c36f0fd491d6173c4ef65b97720c1fdb690d719b30d235aed4b5131d0b121c
|
3 |
+
size 32321536
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f54a800eb7c5b56c3931f067c591ea7aa94f7727480a0209c247dfb4265370c
|
3 |
+
size 20185088
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77d4ae2439d5bb6ce0f8ba7e5524415136420e9f882f6c505586a6122afe0536
|
3 |
+
size 29489152
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:813167f8c3fbec821de923dcc964eb298074823e850a2ae12116c016a74818d0
|
3 |
+
size 31520768
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1aa08fb4b18ac7bd487d55ed198d62739d66a933fe8653382c360f146a7d65c8
|
3 |
+
size 20185088
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14ee58f43e3bd82e4b30713f376f34b013dae107b138ab685f6e2d1e46204f88
|
3 |
+
size 27754496
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbd76ec5c3c35c5fa9726eebfd07a254ae88ec0cdbbfa3a50b08b2f591bf9499
|
3 |
+
size 20185088
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:326be74ba1f0aefd3fb232e49c7acc1302bbb29184aea3faacb89e4e29fb5b77
|
3 |
+
size 32321536
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:360995cafce8cec908489bf3c1b4870b5aa01e7e0f16453e1d49ca91a38ea747
|
3 |
+
size 20185088
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16b7197f41abcb91030f089ecde8ba3e200c32ac7b02497599b6398b97b6e3cc
|
3 |
+
size 20185088
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:910585266da4ed405c7667ebc725a6046f43ac59be6ff0b7d95c2fa3e0421afd
|
3 |
+
size 29489152
|
params_shard_6.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:663c48a31bb48919dee535d189a238f4dd0e9b30eb7a437b2b6500d664e073f4
|
3 |
+
size 32321536
|