Add weights and config
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +77 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
- params_shard_51.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,77 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q4f16_0",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 11008,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 26,
|
10 |
+
"rms_norm_eps": 1e-06,
|
11 |
+
"vocab_size": 32000,
|
12 |
+
"position_embedding_base": 10000,
|
13 |
+
"context_window_size": 2048,
|
14 |
+
"prefill_chunk_size": 2048,
|
15 |
+
"num_key_value_heads": 32,
|
16 |
+
"head_dim": 128,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"max_batch_size": 80
|
19 |
+
},
|
20 |
+
"vocab_size": 32000,
|
21 |
+
"context_window_size": 2048,
|
22 |
+
"sliding_window_size": -1,
|
23 |
+
"prefill_chunk_size": 2048,
|
24 |
+
"attention_sink_size": -1,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"mean_gen_len": 128,
|
27 |
+
"max_gen_len": 512,
|
28 |
+
"shift_fill_factor": 0.3,
|
29 |
+
"temperature": 0.6,
|
30 |
+
"presence_penalty": 0.0,
|
31 |
+
"frequency_penalty": 0.0,
|
32 |
+
"repetition_penalty": 1.0,
|
33 |
+
"top_p": 0.9,
|
34 |
+
"tokenizer_files": [
|
35 |
+
"tokenizer.model",
|
36 |
+
"tokenizer_config.json",
|
37 |
+
"tokenizer.json"
|
38 |
+
],
|
39 |
+
"tokenizer_info": {
|
40 |
+
"token_postproc_method": "byte_fallback",
|
41 |
+
"prepend_space_in_encode": true,
|
42 |
+
"strip_space_in_decode": true
|
43 |
+
},
|
44 |
+
"conv_template": {
|
45 |
+
"name": "st-llm",
|
46 |
+
"system_template": "Below is an instruction that describes a task, paired with an input that provides further context. Write a response that appropriately completes the request.\n\n### Instruction:\n{system_message}</s>",
|
47 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
48 |
+
"system_prefix_token_ids": null,
|
49 |
+
"add_role_after_system_message": true,
|
50 |
+
"roles": {
|
51 |
+
"user": "### Input:",
|
52 |
+
"assistant": "### Response:"
|
53 |
+
},
|
54 |
+
"role_templates": {
|
55 |
+
"user": "{user_message}",
|
56 |
+
"assistant": "{assistant_message}",
|
57 |
+
"tool": "{tool_message}"
|
58 |
+
},
|
59 |
+
"messages": [],
|
60 |
+
"seps": [
|
61 |
+
"</s>"
|
62 |
+
],
|
63 |
+
"role_content_sep": "\n",
|
64 |
+
"role_empty_sep": "\n",
|
65 |
+
"stop_str": [
|
66 |
+
"</s>"
|
67 |
+
],
|
68 |
+
"stop_token_ids": [
|
69 |
+
2
|
70 |
+
],
|
71 |
+
"function_string": "",
|
72 |
+
"use_function_calling": false
|
73 |
+
},
|
74 |
+
"pad_token_id": 0,
|
75 |
+
"bos_token_id": 1,
|
76 |
+
"eos_token_id": 2
|
77 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efc6b584daf4fdfbd88efbaf9bd7fd5c8f2d5f4eb1567046317156af536f1a2b
|
3 |
+
size 65536000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:803d7dcef7dbf789a0f7f74841d410c96e411b67de43897182be5efba3f1ca32
|
3 |
+
size 30744576
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a8d433b583eea228b869019b4f11069a075d8bc6218e0909a346e9ad4a3e92a
|
3 |
+
size 45088768
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23d396b31eff174210b09515417a3e13c3b7b0ac77a8593aa049a473b0b81691
|
3 |
+
size 25165824
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe019cd423bff25b9d350b8daa8b89a29a88237f78e3580b9ce3ff0c7f003392
|
3 |
+
size 29253632
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97092e6b320d0816e071e40c970f24506cb7c5c13305a9cb3f4508a3f04a7eb1
|
3 |
+
size 31989760
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:536f6ade2bfa2dd25f8ccc2d133cbd608b38afb49924a7f54df9d641eab9c2ae
|
3 |
+
size 45088768
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:776a0b4a0fa3d6cf54c16579a35b7db03afc000d7c51ef3badcbe89aa605f906
|
3 |
+
size 25165824
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40c1cd5d2c635455d55563586c3bf80941061f3e8c08315da2a039ab124633ce
|
3 |
+
size 22544384
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bd15baa3d320f3a74e65ab4b80a507b35f114c82b2be5642396c7880da8fc65
|
3 |
+
size 45088768
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4b2cece71d71cf43f61bde15cb731047dd7912fcfa783078f03bab2c4eadc0e
|
3 |
+
size 25165824
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:400af258882c42e58c310edc10bedf834dd85b46c916f159c90081825e39f5f5
|
3 |
+
size 32661504
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f92ede57aee53035083e0d87a8c0bc2f1811e95e429d6f589c2bf88640567372
|
3 |
+
size 45088768
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ee10dfc9f3dbcab42b3d803337b832ecb9c72cc92af0f4091331eda345aea56
|
3 |
+
size 31989760
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5f2d978ed0b3eb4abfd7907db88d343b8a3e223ca942366c76ccccdd33d78b1
|
3 |
+
size 45088768
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:641cc30202b544c947ccf8ab680c91d979a97296b6cb99036791819cdf730b88
|
3 |
+
size 25165824
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:841b5c6a96e836327aa7ef70ba731b2aa5985ff34441689470f1317529bda83f
|
3 |
+
size 22544384
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d548868ddf724c2abe72045cefac3fbac1a17143ef2808d0c0d367d1fe80c76b
|
3 |
+
size 45088768
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19924a346372a1b5e501dcf92a724f4b05f6168bbab98e3374a9f4983dff025f
|
3 |
+
size 25165824
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13526d9ffbbd2a7cd75e220a645f4086433ee3a27a85c41f989a62410530022c
|
3 |
+
size 32661504
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02a1b90197043325429d20b94d8c224cb816911c3e49c3924e2e9ed35c2377ae
|
3 |
+
size 31989760
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b350c124c1b652e6618a8832d6944fa35d90404f44add3612ec1a591193c3cc1
|
3 |
+
size 45088768
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7e3593f9a4a32a32e00ac6f721906e952e016d1d081ebb246cf7b5e2ef548d3
|
3 |
+
size 25165824
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae2fdd912388b19665bf1f81426d0433b7c37082383c71809d33fffa8697049f
|
3 |
+
size 25165824
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6afc925193917e62c1746929c358e172f5c8e487e34e44ded58d3a16d6420dea
|
3 |
+
size 22544384
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ec8a4896a49f3dd6f0cb9f2a8867d4498e1e9dbfd8fdfaeb981377ce6868def
|
3 |
+
size 45088768
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4ed45fb6d33f9811f1fe826c19e0015b4570d42c0c427bb4515649bc70b4216
|
3 |
+
size 25165824
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa3aecd7959e60567b306d07183c7c17c82fb36522dab158e699d87046a0a8c8
|
3 |
+
size 32661504
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfb50a25f63e7edc93131da847dc5d4c8aaf06ba1fa2c15a3ed1bf966fd7a31c
|
3 |
+
size 31989760
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:513284186e9d8ee26942701ba720f458e0ca817f833c317556ba1fbc770a92ab
|
3 |
+
size 45088768
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:143c4878e8c7c9bc205ceb019a1b37a2f6dc01ec8fed3548548f21eabe789196
|
3 |
+
size 25165824
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b317a6233769b6c850e9a0471fd4b126b6468ed0f30b2bab9df3d766742b69a8
|
3 |
+
size 22544384
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e5800d168ffb766d0dd311842060f1b42c25c1a3cbd59211c25732f85f85f37
|
3 |
+
size 45088768
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64ac4ad81eba8892ff3d4faed773f7623a9ecda37cedb4c4ca271e1332748085
|
3 |
+
size 25165824
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e77756b9e68d6a9846ac3d0f0e29844ed1c1965882eee3b5f53f205da7ebf94
|
3 |
+
size 22544384
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f3c6b2d53ce3a522f29cce947fd62e326ec44c586128897b99884a4fa239883
|
3 |
+
size 32661504
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65e389cf0e91650e285ef978925d26110f3947acc916c6b66b051f64ad9a0fcf
|
3 |
+
size 31989760
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:322805784f5af0d93175c3978c0859f17a53fa50ce2a33844a3c399ab47e4206
|
3 |
+
size 45088768
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb0033f05cc7dd260a40d22e22cb5dfb0c48f6b8466991f395a5d4fb67664239
|
3 |
+
size 25165824
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:634bbcdad97c16aa7c8bdf98606bb8d31e5018a4749606df5ed0be7f405ff133
|
3 |
+
size 22544384
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66b29c02bba99259d610fac040266b77eb0358e2b700c4fe5b882355bb54738e
|
3 |
+
size 45088768
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e75adcf4e5e4b62df2e9d4e38504ff8e3ac9e6b96a8d8fadc41bcce6fac8e9a
|
3 |
+
size 25165824
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa15aeff3a2be13f4c8c8ac60a8fe817de9755557da4b362ed5967fd70643812
|
3 |
+
size 32661504
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77319e63f9469e0fa0be766692bdd944102d98eb3f0ef1b41f58cafe20c0c2ce
|
3 |
+
size 31989760
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e336c3af55dc02b0e2a7cbdd0012482d1a2578adfcbd1e58f9075a10f61811f8
|
3 |
+
size 45088768
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35f44190761bfa94b646b1d6cce3ceee05cbdaa7cd86aa142e2e03bbf6edf3f4
|
3 |
+
size 45088768
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b3edbc89976c1c43f68d31cbc0a2890d680e813c59ed431d5d62370126f616a
|
3 |
+
size 25165824
|
params_shard_51.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34af4bb9c70f00782ee1ec9725d6230f77d98982f0a8809fa8192d01c2ec452e
|
3 |
+
size 22544384
|