Add weights
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +16 -0
- config.json +5 -0
- merges.txt +0 -0
- mlc-chat-config.json +80 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
README.md
CHANGED
@@ -1,3 +1,19 @@
|
|
1 |
---
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2 |
license: apache-2.0
|
|
|
|
|
|
|
|
|
3 |
---
|
|
|
|
|
|
1 |
---
|
2 |
+
language:
|
3 |
+
- en
|
4 |
+
- fr
|
5 |
+
- de
|
6 |
+
- es
|
7 |
+
- it
|
8 |
+
- pt
|
9 |
+
- ru
|
10 |
+
- zh
|
11 |
+
- ja
|
12 |
license: apache-2.0
|
13 |
+
base_model: mistralai/Mistral-Nemo-Instruct-2407
|
14 |
+
base_model_relation: quantized
|
15 |
+
library_name: mlc-llm
|
16 |
+
pipeline_tag: text-generation
|
17 |
---
|
18 |
+
|
19 |
+
4-bit [OmniQuant](https://arxiv.org/abs/2308.13137) quantized version of [Mistral-Nemo-Instruct-2407](https://huggingface.co/mistralai/Mistral-Nemo-Instruct-2407).
|
config.json
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"quantization_config": {
|
3 |
+
"bits": 4
|
4 |
+
}
|
5 |
+
}
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,80 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "mistral",
|
4 |
+
"quantization": "w4a16g128",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 5120,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 40,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 131072,
|
12 |
+
"position_embedding_base": 1000000.0,
|
13 |
+
"num_key_value_heads": 8,
|
14 |
+
"head_dim": 128,
|
15 |
+
"context_window_size": 8192,
|
16 |
+
"sliding_window_size": -1,
|
17 |
+
"prefill_chunk_size": 128,
|
18 |
+
"attention_sink_size": 4,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"max_batch_size": 128
|
21 |
+
},
|
22 |
+
"vocab_size": 131072,
|
23 |
+
"context_window_size": 8192,
|
24 |
+
"sliding_window_size": -1,
|
25 |
+
"prefill_chunk_size": 128,
|
26 |
+
"attention_sink_size": 4,
|
27 |
+
"tensor_parallel_shards": 1,
|
28 |
+
"pipeline_parallel_stages": 1,
|
29 |
+
"temperature": 1.0,
|
30 |
+
"presence_penalty": 0.0,
|
31 |
+
"frequency_penalty": 0.0,
|
32 |
+
"repetition_penalty": 1.0,
|
33 |
+
"top_p": 1.0,
|
34 |
+
"tokenizer_files": [
|
35 |
+
"vocab.json",
|
36 |
+
"merges.txt",
|
37 |
+
"tokenizer_config.json"
|
38 |
+
],
|
39 |
+
"tokenizer_info": {
|
40 |
+
"token_postproc_method": "byte_fallback",
|
41 |
+
"prepend_space_in_encode": false,
|
42 |
+
"strip_space_in_decode": false
|
43 |
+
},
|
44 |
+
"conv_template": {
|
45 |
+
"name": "mistral_default",
|
46 |
+
"system_template": "[INST] {system_message}",
|
47 |
+
"system_message": "Always assist with care, respect, and truth. Respond with utmost utility yet securely. Avoid harmful, unethical, prejudiced, or negative content. Ensure replies promote fairness and positivity.",
|
48 |
+
"system_prefix_token_ids": [
|
49 |
+
1
|
50 |
+
],
|
51 |
+
"add_role_after_system_message": false,
|
52 |
+
"roles": {
|
53 |
+
"user": "[INST]",
|
54 |
+
"assistant": "[/INST]",
|
55 |
+
"tool": "[INST]"
|
56 |
+
},
|
57 |
+
"role_templates": {
|
58 |
+
"user": "{user_message}",
|
59 |
+
"assistant": "{assistant_message}",
|
60 |
+
"tool": "{tool_message}"
|
61 |
+
},
|
62 |
+
"messages": [],
|
63 |
+
"seps": [
|
64 |
+
" "
|
65 |
+
],
|
66 |
+
"role_content_sep": " ",
|
67 |
+
"role_empty_sep": "",
|
68 |
+
"stop_str": [
|
69 |
+
"</s>"
|
70 |
+
],
|
71 |
+
"stop_token_ids": [
|
72 |
+
2
|
73 |
+
],
|
74 |
+
"function_string": "",
|
75 |
+
"use_function_calling": false
|
76 |
+
},
|
77 |
+
"pad_token_id": 0,
|
78 |
+
"bos_token_id": 1,
|
79 |
+
"eos_token_id": 2
|
80 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0671f0173c49bb84ef7f86712e331b571daf808e508743ca00123fa042172b6
|
3 |
+
size 335544320
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3aa798c4eb108b870d83cc3092a05f8210de24dec79f9757037e1285be2a5a5
|
3 |
+
size 36700160
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f091b0991ac41259584a7316fe4faae4a7b155bc810b7354a7ca69b86be288a
|
3 |
+
size 73400320
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:052fd930e3603e45e910abee6ec5ad612532aec7324195b55831f8923129bee1
|
3 |
+
size 36700160
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b732fda78155066addbe226d7a962e853fce9164769658318113e136cf8595ce
|
3 |
+
size 73400320
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e4435ea1a606764dc1eb864445a6ec0c7d067d26f884846237f9295dce45290
|
3 |
+
size 30494720
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6ffcf42914818ff25e6a5a24150813e1a0d228a7b6f02361c18296750655ca7
|
3 |
+
size 36700160
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:788eec42b6947cccfe747981edd85bec7d37865531a3e79feec91d5b5c562edc
|
3 |
+
size 73400320
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69dc2780c62b61090c76ab8c93f2927f7de54e7b433d67b4ced4e1d0a36f80d6
|
3 |
+
size 30494720
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b948e688e7803163468550561faacc25c93306535c7316a911c3d1cc4f75e0a
|
3 |
+
size 36700160
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:faa211970732761b0e242d5ae6bad6a0803418da22cc5512481f6e21c6944137
|
3 |
+
size 73400320
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc483edb98da56f5aefcf907a5448d88a601b3116ed75eeefa28ac4a06bab593
|
3 |
+
size 30494720
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80b152dcbf109430be053e80c31c2bcf7daa3191a5ffd1c054efe1a3b76fdfb7
|
3 |
+
size 36700160
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ef2258af91d105dafc35bf38adf36b8ad1826ac28e98a9df3fc396cc91fe739
|
3 |
+
size 30494720
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce65dd5c8b113b2b30e76a8e4e300c0123f0c443de0b0b003a0e1382fc286bb6
|
3 |
+
size 73400320
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad037ffa8d6924656e312344183b0d420ff9293b6343b159e73f7b88377677f6
|
3 |
+
size 30494720
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d827c5a6931f84ba7ca95ad289d26fc724aad18a1de813b872c651da5be2ae87
|
3 |
+
size 36700160
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad11115a410a1185eb377e76c338c054e3df719313037a12de7945c2f9b092ed
|
3 |
+
size 73400320
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7737424a2e952198d2fe5c91e06f6c836049b9feff1cc71be5fd35f2679689d6
|
3 |
+
size 30494720
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed248b0d7952423a5c4016bae161d7f5db7502a36734cf7d29a2c432bf0bc80c
|
3 |
+
size 36700160
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a318f492b7bee129447950b9fe9447c0395f0c8a4e19943f0bea5143e01864c0
|
3 |
+
size 73400320
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5131e530aeb9851324560e69b9d79be212ac54d24ef68fef95f8f61b05565dc1
|
3 |
+
size 30494720
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7111e7f0f1b5a5429a78ed7c10fd0fac9968e56d7b330f4a405071a7c8bd32c7
|
3 |
+
size 36700160
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:568aa5098d890e6850c9b0ed7ede711bad2438e0718e162d2249cd8dcf1bb673
|
3 |
+
size 73400320
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7cad449b8068c7d61c647eeadd55f722adb0365a5606121be19ec95dff8e46c
|
3 |
+
size 36700160
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c603323ebe0e6af014639ee9b3659914d83b0779a263be51aa045a612ad1d776
|
3 |
+
size 30494720
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2859ecf27080e478627cab50b78db1ca4f3918908b61d114952420a6bfcca40
|
3 |
+
size 27033600
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57d6844e6ed9acfc424464dd18302b0a44b653692aaa2086ee797365a2334a06
|
3 |
+
size 27033600
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6afa59d80288dfb4c18a61221be939d245cee60271c3bc1817463a2d13046bf4
|
3 |
+
size 73400320
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68143c2c28787595bd0e1f716ba8bca7f2cd508c373df21da1f7e63875f76ba3
|
3 |
+
size 30494720
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:729c5a1d79848dffd9d29531a88a08991877edc18896288dcf2737cee1fa97fa
|
3 |
+
size 36700160
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac043e43c896308cd3c65f6c9ea84268571b2942e866ff60cb73bc625dd4c03e
|
3 |
+
size 73400320
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d9a0e9ef1cad1fb5b08fef5d83b45a10ae7e437b70f17cec4496389710ceb50
|
3 |
+
size 30494720
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcf295e9963d9796234a52101af54cce247074127f5338a6a458b9998782bf7c
|
3 |
+
size 36700160
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:104866d8cbe1c863ff6c09e0e7cb1d5fca9d1ba711cfd802d73c22aa58a0224f
|
3 |
+
size 73400320
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae2484c5a09d8eb5799684e71d99e97827e6ede847a5c9d93dc7b2b60b690d5d
|
3 |
+
size 73400320
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b736c09ec99249ec01abc68353851ab1c6781639b601e43b890684b824b11507
|
3 |
+
size 30494720
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c2c83496cad9aaffdc28255771ced19a5fa10ba1f0bbcb01918c8ff1b6a5f09
|
3 |
+
size 335544320
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79866085d41f512702c155ff567e3b1c2036c3a835c8718d7b65b9747708af28
|
3 |
+
size 36700160
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4d3f3b57ec0c8248001cb14bb3aacce3f9288555db080f9146d5bb25d4308a1
|
3 |
+
size 73400320
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd7855dcdbcef1df48b76c8be33872228b53d0478132810c8d29b74e3f0c470f
|
3 |
+
size 24770560
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d9fd149e3f4bbc9a999c0eece952d2c72de6e2ae4c93ed70b1660530d49e443
|
3 |
+
size 36700160
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef69c922eb44ccbeaef4319db53c057ade07d9b04208abba5241130db64ed904
|
3 |
+
size 73400320
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8fc54260bfc8b143549371dd6ed9ce0fac7375523381f093a5d7e102215d8a8
|
3 |
+
size 30494720
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ab4906d04156736b0c48f9f57471260c71199f26e8c29e880dd3ca5b126de47
|
3 |
+
size 36700160
|