ruihanglai
committed on
Commit
•
a523fc2
1
Parent(s):
b51d693
init
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +78 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
- params_shard_51.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q3f16_0",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 11008,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-06,
|
11 |
+
"vocab_size": 32000,
|
12 |
+
"position_embedding_base": 10000,
|
13 |
+
"context_window_size": 4096,
|
14 |
+
"prefill_chunk_size": 2048,
|
15 |
+
"num_key_value_heads": 32,
|
16 |
+
"head_dim": 128,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"max_batch_size": 80
|
19 |
+
},
|
20 |
+
"vocab_size": 32000,
|
21 |
+
"context_window_size": 4096,
|
22 |
+
"sliding_window_size": -1,
|
23 |
+
"prefill_chunk_size": 2048,
|
24 |
+
"attention_sink_size": -1,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"temperature": 0.6,
|
27 |
+
"presence_penalty": 0.0,
|
28 |
+
"frequency_penalty": 0.0,
|
29 |
+
"repetition_penalty": 1.0,
|
30 |
+
"top_p": 0.9,
|
31 |
+
"tokenizer_files": [
|
32 |
+
"tokenizer.model",
|
33 |
+
"tokenizer.json",
|
34 |
+
"tokenizer_config.json"
|
35 |
+
],
|
36 |
+
"tokenizer_info": {
|
37 |
+
"token_postproc_method": "byte_fallback",
|
38 |
+
"prepend_space_in_encode": true,
|
39 |
+
"strip_space_in_decode": true
|
40 |
+
},
|
41 |
+
"conv_template": {
|
42 |
+
"name": "llama-2",
|
43 |
+
"system_template": "[INST] <<SYS>>\n{system_message}\n<</SYS>>\n\n",
|
44 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
45 |
+
"system_prefix_token_ids": [
|
46 |
+
1
|
47 |
+
],
|
48 |
+
"add_role_after_system_message": false,
|
49 |
+
"roles": {
|
50 |
+
"user": "<s>[INST]",
|
51 |
+
"assistant": "[/INST]",
|
52 |
+
"tool": "[INST]"
|
53 |
+
},
|
54 |
+
"role_templates": {
|
55 |
+
"user": "{user_message}",
|
56 |
+
"assistant": "{assistant_message}",
|
57 |
+
"tool": "{tool_message}"
|
58 |
+
},
|
59 |
+
"messages": [],
|
60 |
+
"seps": [
|
61 |
+
" ",
|
62 |
+
" </s>"
|
63 |
+
],
|
64 |
+
"role_content_sep": " ",
|
65 |
+
"role_empty_sep": " ",
|
66 |
+
"stop_str": [
|
67 |
+
"[INST]"
|
68 |
+
],
|
69 |
+
"stop_token_ids": [
|
70 |
+
2
|
71 |
+
],
|
72 |
+
"function_string": "",
|
73 |
+
"use_function_calling": false
|
74 |
+
},
|
75 |
+
"pad_token_id": 0,
|
76 |
+
"bos_token_id": 1,
|
77 |
+
"eos_token_id": 2
|
78 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3987364d81690f49b161a1bfc5ec7599acd5e44383a74b7c7e2c954bb9843e3
|
3 |
+
size 52736000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5d6a9f7b1f64fdb87b236caff4c444cbd7878279bfcc0508fc9b62418077c3c
|
3 |
+
size 36282368
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f375b9bed8d1c06cfe452d1c0601f394bdb316de990e620fc215416602c8599
|
3 |
+
size 36282368
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a143b08ff2a1d2c79fb76767e182fb3cbcd272ce415da103026035615692286d
|
3 |
+
size 30482432
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7689983fc5dd4d475763f52a3e4413426f7a25e4f1834d2312fbc2a22e92a9c0
|
3 |
+
size 27325440
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c8fb83fd5c1db1b5a0546705ab6da3dd1ad75b352860decd4cd9bc0dd887ca0
|
3 |
+
size 36282368
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebc66c3b14d8fb0bbefd40ddabf498fc6b1976860b46a784b84ff196fc8041a8
|
3 |
+
size 20250624
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c57591a197000ca3666bce336dd0ee2e47a1bd4ce0a26ca047cc47ae0bb332e
|
3 |
+
size 32494592
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3818bee81b9068e59465c5f76adf22de30a6afb024b290784a9a11492fca1c3a
|
3 |
+
size 36282368
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d3168b092898bf5f9fd1ff75207ea7165d4bfdb7dcc22ab8c8c90a412e5eb98
|
3 |
+
size 30482432
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c5efd5386db4bb83881213f7158662bbf32c1261b74bfa0e573428f5b1ea64c
|
3 |
+
size 27325440
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51b6c02ae8ad1859a67f3fb9f52e446433615b0b2570c6ca4f563bcf4795a980
|
3 |
+
size 36282368
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:896252b8c31a1b3182632ce5a7a2ed5280110115fbaba800cdbdc7ef0d7a0e8e
|
3 |
+
size 20250624
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02b5e633002b3fddd7bcb4142f80f5fbb43c4260ccd6fc587df5c2f4c96b21f8
|
3 |
+
size 20250624
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e13d42020340d4fde73a0dc908e365d0e8b2d3c4022603cd62f13223e36bbdc
|
3 |
+
size 32494592
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:874b200b0c1f2869f06d77b760b5b9c9d37642272ecc51f268ba9181482d6a99
|
3 |
+
size 36282368
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:523231e58dc5e0938f66d492ef94f03e68935bfb5a2fd6ab6dc914b7bd35d516
|
3 |
+
size 30482432
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f05f7fd8aedbac09a55af7abfb2d2a6c273d54cc7cf1146046b961afeab006d
|
3 |
+
size 27325440
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38b775547675408b2217f9418eb1acd66e002e496907a44174028b14677b02ad
|
3 |
+
size 52736000
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d3a28b6759cdf6d07d350f250a88099ba9eb63aae91ee6f8184adea2d40eb33
|
3 |
+
size 32290304
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a4b17799f79ac2a4e807744e25672ffee89f24216d57acb8c6ae765e8682405
|
3 |
+
size 36282368
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5aba910c82a41052bc5c964b333888be0c7cf2305a1d2e8e44a32e699e0e5503
|
3 |
+
size 29586432
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d464448a140e56a1b11d90144bbb4cb5d12ba77595e5ded3490f98d58e66c4b
|
3 |
+
size 36282368
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f697ddd17bc6d3edaf9d7b1365effc99c08dddab21470fff93f25311f522edb4
|
3 |
+
size 31492608
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a73e9cd09f58165ada95b9cf9a7f9aba7c13c7b0a0acab1348fb93eaceaeaa7
|
3 |
+
size 20250624
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:deb7cbe2b8ef865e4c340759764ddc7a4629a92a27cb7c106e3b990c53e3ef8d
|
3 |
+
size 32494592
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5481131a0bb1bcc7b5a221627fad53dc0c2b911fe9213d6323412f891d22cd1b
|
3 |
+
size 36282368
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd148f9222c2ac018c1740fe68201565890c0de82b47cde80a9f80eee3d72bcd
|
3 |
+
size 30482432
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c14b2c86f01ffb5da7dce37ab8b5ed24878282fa45779bb0c6e99a5da75e3ba
|
3 |
+
size 27325440
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a1ba639e7314bb9e7f8b73e127724a8b647c826cef8cf3ebbff0fe959115ab1
|
3 |
+
size 36282368
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c21669b660714277376614b842262878bdc2c265d5d00f51ef11f07779569bdb
|
3 |
+
size 20250624
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:451c626439245cd9dd4e4eca810a07e3b1171d16c92f08f6f654a778b747ffff
|
3 |
+
size 32494592
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b65041c60ffd54e55f818de472535ecae391acd18a977cd91ce8bd48d312ad17
|
3 |
+
size 36282368
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e730a2a535840633e3cdefdfec309f78a7011d515691a078ecd176a6d9e32534
|
3 |
+
size 30482432
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:774851a8dd54cc06a68f81deac747ca92979aa49563394cce70f5d6a07e1e1de
|
3 |
+
size 36282368
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bdfebb6c176f97465ecbb6fe568ccadb60b22569c8280912a92e2168304914da
|
3 |
+
size 27325440
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4371636ac237d6c35f57ff4a44917401cd1e816f8285a40254ab6f6a5ba4f79
|
3 |
+
size 36282368
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d8729dee66005a8c52825d4a02b419a18a8c123c1880bc005d40182ed71ab29
|
3 |
+
size 20250624
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bdc5de65bb0fb79a18427b8ae2cd4dfa4c4dbd800c77bffde7f1978c50bf6b6c
|
3 |
+
size 32494592
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:820bbd5880b88fd9479e0ce2b80b9173ad54172ab0afda10af32fc8e0cd09534
|
3 |
+
size 36282368
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca5207b88425902012e866ffc1541c6503b37a119c7186b36a452d8a9bd119ae
|
3 |
+
size 30482432
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42c02d04a4e2a89fc37112b5a21ff3c0da26dafb0ee6d321282c0f3cf4a46ffe
|
3 |
+
size 27325440
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aba3175520dc8db8059efd1a9a261c734aed9227e74bff5082c9e675b93ec684
|
3 |
+
size 36282368
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59a1c6537a4e427a99c6441189740a2c4fcf6f3726c9c8c88910b6abbb09beba
|
3 |
+
size 20250624
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:beafff30299771e2d84751d013011488d341f8a8e1265a75727584a67d379bde
|
3 |
+
size 32494592
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:069cdff1af78a6489173357371d267698dbc595eb70f738ec11f8b513f9cf6c4
|
3 |
+
size 30482432
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2ec1ee2b0cb25307667831a9b3c1261a697d3a5ddfa1c5a7a3a793158f26ba1
|
3 |
+
size 36282368
|
params_shard_51.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e512e05dd6f8d35c1bceabcb71aaa799d048ebd9cd4fd0021b98a0378b7becec
|
3 |
+
size 30482432
|