Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +80 -0
- ndarray-cache.json +0 -0
- params_shard_143.bin +3 -0
- params_shard_149.bin +3 -0
- params_shard_151.bin +3 -0
- params_shard_153.bin +3 -0
- params_shard_154.bin +3 -0
- params_shard_155.bin +3 -0
- params_shard_156.bin +3 -0
- params_shard_157.bin +3 -0
- params_shard_158.bin +3 -0
- params_shard_159.bin +3 -0
- params_shard_160.bin +3 -0
- params_shard_161.bin +3 -0
- params_shard_162.bin +3 -0
- params_shard_163.bin +3 -0
- params_shard_164.bin +3 -0
- params_shard_165.bin +3 -0
- params_shard_166.bin +3 -0
- params_shard_167.bin +3 -0
- params_shard_168.bin +3 -0
- params_shard_169.bin +3 -0
- params_shard_170.bin +3 -0
- params_shard_171.bin +3 -0
- params_shard_172.bin +3 -0
- params_shard_173.bin +3 -0
- params_shard_174.bin +3 -0
- params_shard_175.bin +3 -0
- params_shard_176.bin +3 -0
- params_shard_177.bin +3 -0
- params_shard_178.bin +3 -0
- params_shard_179.bin +3 -0
- params_shard_180.bin +3 -0
- params_shard_181.bin +3 -0
- params_shard_182.bin +3 -0
- params_shard_183.bin +3 -0
- params_shard_184.bin +3 -0
- params_shard_185.bin +3 -0
- params_shard_186.bin +3 -0
- params_shard_187.bin +3 -0
- params_shard_188.bin +3 -0
- params_shard_189.bin +3 -0
- params_shard_190.bin +3 -0
- params_shard_191.bin +3 -0
- params_shard_192.bin +3 -0
- params_shard_193.bin +3 -0
- params_shard_194.bin +3 -0
- params_shard_195.bin +3 -0
- params_shard_196.bin +3 -0
- params_shard_197.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,80 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q4f16_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 8192,
|
7 |
+
"intermediate_size": 28672,
|
8 |
+
"num_attention_heads": 64,
|
9 |
+
"num_hidden_layers": 80,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 128256,
|
12 |
+
"tie_word_embeddings": false,
|
13 |
+
"position_embedding_base": 6315088.0,
|
14 |
+
"rope_scaling": null,
|
15 |
+
"context_window_size": 32768,
|
16 |
+
"prefill_chunk_size": 8192,
|
17 |
+
"num_key_value_heads": 8,
|
18 |
+
"head_dim": 128,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"pipeline_parallel_stages": 1,
|
21 |
+
"max_batch_size": 128
|
22 |
+
},
|
23 |
+
"vocab_size": 128256,
|
24 |
+
"context_window_size": 32768,
|
25 |
+
"sliding_window_size": -1,
|
26 |
+
"prefill_chunk_size": 8192,
|
27 |
+
"attention_sink_size": -1,
|
28 |
+
"tensor_parallel_shards": 1,
|
29 |
+
"pipeline_parallel_stages": 1,
|
30 |
+
"temperature": 1.0,
|
31 |
+
"presence_penalty": 0.0,
|
32 |
+
"frequency_penalty": 0.0,
|
33 |
+
"repetition_penalty": 1.0,
|
34 |
+
"top_p": 1.0,
|
35 |
+
"tokenizer_files": [
|
36 |
+
"tokenizer.json",
|
37 |
+
"tokenizer_config.json"
|
38 |
+
],
|
39 |
+
"tokenizer_info": {
|
40 |
+
"token_postproc_method": "byte_level",
|
41 |
+
"prepend_space_in_encode": false,
|
42 |
+
"strip_space_in_decode": false
|
43 |
+
},
|
44 |
+
"conv_template": {
|
45 |
+
"name": "llama-3_1",
|
46 |
+
"system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}<|eot_id|>",
|
47 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
48 |
+
"system_prefix_token_ids": [
|
49 |
+
128000
|
50 |
+
],
|
51 |
+
"add_role_after_system_message": true,
|
52 |
+
"roles": {
|
53 |
+
"user": "<|start_header_id|>user",
|
54 |
+
"assistant": "<|start_header_id|>assistant",
|
55 |
+
"tool": "<|start_header_id|>ipython"
|
56 |
+
},
|
57 |
+
"role_templates": {
|
58 |
+
"user": "{user_message}",
|
59 |
+
"assistant": "{assistant_message}",
|
60 |
+
"tool": "{tool_message}"
|
61 |
+
},
|
62 |
+
"messages": [],
|
63 |
+
"seps": [
|
64 |
+
"<|eot_id|>"
|
65 |
+
],
|
66 |
+
"role_content_sep": "<|end_header_id|>\n\n",
|
67 |
+
"role_empty_sep": "<|end_header_id|>\n\n",
|
68 |
+
"stop_str": [],
|
69 |
+
"stop_token_ids": [
|
70 |
+
128001,
|
71 |
+
128008,
|
72 |
+
128009
|
73 |
+
],
|
74 |
+
"function_string": "",
|
75 |
+
"use_function_calling": false
|
76 |
+
},
|
77 |
+
"pad_token_id": 0,
|
78 |
+
"bos_token_id": 128000,
|
79 |
+
"eos_token_id": 128001
|
80 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_143.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82d55b400e071ade4a2c2ed1d118972891b05cc6e45a2f95737be109ee6f52ed
|
3 |
+
size 234881024
|
params_shard_149.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56cc1494ebd3ae625042b3bdfa1da7897504731b3941b9ccbb9df52275d10677
|
3 |
+
size 117440512
|
params_shard_151.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ccf246bc87fe3d7efe5521e2812dd91f9463ca67f731884b694332411c2aed9
|
3 |
+
size 234881024
|
params_shard_153.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37a87cdbbe666aa5a536077de90ff477742e956588ec70ac23e1873a6c4de456
|
3 |
+
size 41943040
|
params_shard_154.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5f8d90de98863c9d5a697074ca5efa04357ce372ff7e29de179f864853caa6f
|
3 |
+
size 33554432
|
params_shard_155.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb196c6dddb67e2da1bd75be0c1a6f207d7d4b71393bf4fbcde0f7906c09d7cc
|
3 |
+
size 117440512
|
params_shard_156.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a42f72cc97bcc58192fb62d33bea72a3009738f71950ac6c09e4cdb99608482e
|
3 |
+
size 24150016
|
params_shard_157.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7ee0ae12bde72e184c2ee5720b3c05a672be8a2c7744c694936ecc68bc1e04d
|
3 |
+
size 234881024
|
params_shard_158.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dab45cfafcefda8e820a79cce0b6310cad99133b620a49f9d37af42447106b5a
|
3 |
+
size 29360128
|
params_shard_159.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:353200dacc84a8ccb2e799f2c67317737b81487c25cf826f56a3197401c69757
|
3 |
+
size 41943040
|
params_shard_160.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f2fa77c8f26ba835d28fd272ae8f64c9f9d3046af5462ae8b08dd770d0a21b4
|
3 |
+
size 33554432
|
params_shard_161.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75c286acb42d59ef2510561085d63ad5592ccda76c550f3c077d836f71ad6fab
|
3 |
+
size 41943040
|
params_shard_162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4f3fbad36cdcc17bca1cdba13cc847d25713fc0d8382766c5efb8ac1668a947
|
3 |
+
size 33554432
|
params_shard_163.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:001e7aa58e861d888069d353d557254318e07ba3356cbbbf841fe439eb9f52a9
|
3 |
+
size 29376512
|
params_shard_164.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:680375eec62e7d47786e01655e7a28c29225658c76d35902f0a98ffa3b3b229e
|
3 |
+
size 117440512
|
params_shard_165.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:288f31f447159f7798cce158e7b6375530934d86a3ca3431c4145043fa6121d1
|
3 |
+
size 234881024
|
params_shard_166.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7563110415ead3d6c2af4a5c215ca13869d61b98251f7925754f331d0d2482b9
|
3 |
+
size 29360128
|
params_shard_167.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2515781cef68ac4b79d28e27cdc3f0298f52fa03fd7dda15aa7c2fbf54e7c3c
|
3 |
+
size 117440512
|
params_shard_168.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6558bf28f7fc6cc4d88eef86c8fbf985a58f821246f53c2d71c89cec39bd8fa9
|
3 |
+
size 18923520
|
params_shard_169.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90631c7949caedb176e47f7328789209f1696ac96c4545a8921d850d265d7cb7
|
3 |
+
size 234881024
|
params_shard_170.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c02310002e4b253949d871afd4b1b65593f475b9f776654375e24840a0151856
|
3 |
+
size 29360128
|
params_shard_171.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:453e24c7d53b74d384d2a1c369abff6aa68deaa212d3e73143de2ba13314ecbc
|
3 |
+
size 41943040
|
params_shard_172.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a926b27239f1582a9c18702d38d252235f57fbe54b402ccea9254afb78157a3b
|
3 |
+
size 33554432
|
params_shard_173.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0cf536bfda4f268ebbb859010a9c4d0ddfdbfcd92f5ca814927b471d5251c4b
|
3 |
+
size 117440512
|
params_shard_174.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4443cb30fb7e4587de66c2e9f475f2b974b4ca50d5fc72ccc01540af33ce9e6c
|
3 |
+
size 24150016
|
params_shard_175.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74605df174706e200e68fa7748e2e884f871a8083565f8b8f44fed273db1b07c
|
3 |
+
size 234881024
|
params_shard_176.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9ca63070ab93258d88bbc9957ec55b9998f292b66a6563bdac947a6ff9b6dff
|
3 |
+
size 29360128
|
params_shard_177.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc2db2eb47dbee919f1e77bef14ba1b71f5a2b0038f2fb84b9410fb9dd0fa961
|
3 |
+
size 41943040
|
params_shard_178.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25aa00af65ed44443bf5a108a69511f61aedb41e94090864698c878f9ce908b1
|
3 |
+
size 33554432
|
params_shard_179.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a75d7ab0d947646becd73aae959410d22a6d4004c2fcf795cbda6e1a18c6157d
|
3 |
+
size 41943040
|
params_shard_180.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a117f754ff8aefdb260553fa4129a42f6ee9f1a63e5e77191e28d366177e01e3
|
3 |
+
size 117440512
|
params_shard_181.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:927909d6dad349f6aeaa2cfb89e16b076379d773d04892842609283cd708b797
|
3 |
+
size 29392896
|
params_shard_182.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d09a29e3dffd84a2cdb15e89bc2bf53f8634c9cfd3c771cdd6807c09bbe0f4f
|
3 |
+
size 234881024
|
params_shard_183.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e9460332dc34e4b80e85bb772961fd8344e76f1373cf49b3036dbab113d0e4b
|
3 |
+
size 29360128
|
params_shard_184.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc39df5d11f30044789fbe90b840775b72356a2c49284cf9d04725d168c3c682
|
3 |
+
size 33554432
|
params_shard_185.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab4cfef4c7676b937dafad8fd04664e9686dbf5c48a0afcd33d172acf7140fe4
|
3 |
+
size 117440512
|
params_shard_186.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08a41500c76e9e3fec207c3beffff7a8e1f3dbfbfefa16e0f9d3a550f210cfae
|
3 |
+
size 18907136
|
params_shard_187.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae36b4a501145636424ea26d762181270fe86f1c0e1357b6a31aaa58c0397e73
|
3 |
+
size 234881024
|
params_shard_188.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce53e62d9623c5d54880af8eb1eb6b4896d5c336e16bbbc88aa3a70d926b4a07
|
3 |
+
size 29360128
|
params_shard_189.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73f5d57522d0078b7ea7b682619d33138cda43b88b0bca29c4131ae0b25190f0
|
3 |
+
size 41943040
|
params_shard_190.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f345454a23ce7a692c768db7fde18331f91ed2e169fff9122ca290f77636c2eb
|
3 |
+
size 33554432
|
params_shard_191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73865b3b087d361f305f50e9bc5725d7c7ca5d39e34891e4e377f64beddb9136
|
3 |
+
size 117440512
|
params_shard_192.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a106d6f372270430ea344d6b0edd9ccc0f582dad2436fd40afbae66e93e10236
|
3 |
+
size 24150016
|
params_shard_193.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:782e81e69d8cbbcbf7f21c5d8203681a51270ae48652b4662d3d46993b34903c
|
3 |
+
size 234881024
|
params_shard_194.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8dfb99e3f4ae14a69ed6f4028241961992290f78c9a943367995c5a43b6bb1ca
|
3 |
+
size 29360128
|
params_shard_195.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc744efc0eead6da43a5414b00b5f922cab3ef7e7f288050242c4bdf2a799f94
|
3 |
+
size 41943040
|
params_shard_196.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb96c97cde65ab51fdd8ef7387452689636e28e5bdbaa2d47966c926d3066d69
|
3 |
+
size 33554432
|
params_shard_197.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfd4b25600e1ae5f50cbab8ae6d6fb4bfbe7a5d8f5f693222917ec86bcea219d
|
3 |
+
size 117440512
|