Jeethu committed on
Commit
e7d54dd
1 Parent(s): 904fdb1

Add weights

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
README.md CHANGED
@@ -1,3 +1,19 @@
1
  ---
 
 
 
 
 
 
 
 
 
 
2
  license: apache-2.0
 
 
 
 
3
  ---
 
 
 
1
  ---
2
+ language:
3
+ - en
4
+ - fr
5
+ - de
6
+ - es
7
+ - it
8
+ - pt
9
+ - ru
10
+ - zh
11
+ - ja
12
  license: apache-2.0
13
+ base_model: mistralai/Mistral-Nemo-Instruct-2407
14
+ base_model_relation: quantized
15
+ library_name: mlc-llm
16
+ pipeline_tag: text-generation
17
  ---
18
+
19
+ A 4-bit [OmniQuant](https://arxiv.org/abs/2308.13137)-quantized version of [Mistral-Nemo-Instruct-2407](https://huggingface.co/mistralai/Mistral-Nemo-Instruct-2407).
config.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "quantization_config": {
3
+ "bits": 4
4
+ }
5
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
mlc-chat-config.json ADDED
@@ -0,0 +1,80 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "mistral",
4
+ "quantization": "w4a16g128",
5
+ "model_config": {
6
+ "hidden_size": 5120,
7
+ "intermediate_size": 14336,
8
+ "num_attention_heads": 32,
9
+ "num_hidden_layers": 40,
10
+ "rms_norm_eps": 1e-05,
11
+ "vocab_size": 131072,
12
+ "position_embedding_base": 1000000.0,
13
+ "num_key_value_heads": 8,
14
+ "head_dim": 128,
15
+ "context_window_size": 8192,
16
+ "sliding_window_size": -1,
17
+ "prefill_chunk_size": 128,
18
+ "attention_sink_size": 4,
19
+ "tensor_parallel_shards": 1,
20
+ "max_batch_size": 128
21
+ },
22
+ "vocab_size": 131072,
23
+ "context_window_size": 8192,
24
+ "sliding_window_size": -1,
25
+ "prefill_chunk_size": 128,
26
+ "attention_sink_size": 4,
27
+ "tensor_parallel_shards": 1,
28
+ "pipeline_parallel_stages": 1,
29
+ "temperature": 1.0,
30
+ "presence_penalty": 0.0,
31
+ "frequency_penalty": 0.0,
32
+ "repetition_penalty": 1.0,
33
+ "top_p": 1.0,
34
+ "tokenizer_files": [
35
+ "vocab.json",
36
+ "merges.txt",
37
+ "tokenizer_config.json"
38
+ ],
39
+ "tokenizer_info": {
40
+ "token_postproc_method": "byte_fallback",
41
+ "prepend_space_in_encode": false,
42
+ "strip_space_in_decode": false
43
+ },
44
+ "conv_template": {
45
+ "name": "mistral_default",
46
+ "system_template": "[INST] {system_message}",
47
+ "system_message": "Always assist with care, respect, and truth. Respond with utmost utility yet securely. Avoid harmful, unethical, prejudiced, or negative content. Ensure replies promote fairness and positivity.",
48
+ "system_prefix_token_ids": [
49
+ 1
50
+ ],
51
+ "add_role_after_system_message": false,
52
+ "roles": {
53
+ "user": "[INST]",
54
+ "assistant": "[/INST]",
55
+ "tool": "[INST]"
56
+ },
57
+ "role_templates": {
58
+ "user": "{user_message}",
59
+ "assistant": "{assistant_message}",
60
+ "tool": "{tool_message}"
61
+ },
62
+ "messages": [],
63
+ "seps": [
64
+ " "
65
+ ],
66
+ "role_content_sep": " ",
67
+ "role_empty_sep": "",
68
+ "stop_str": [
69
+ "</s>"
70
+ ],
71
+ "stop_token_ids": [
72
+ 2
73
+ ],
74
+ "function_string": "",
75
+ "use_function_calling": false
76
+ },
77
+ "pad_token_id": 0,
78
+ "bos_token_id": 1,
79
+ "eos_token_id": 2
80
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0671f0173c49bb84ef7f86712e331b571daf808e508743ca00123fa042172b6
3
+ size 335544320
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3aa798c4eb108b870d83cc3092a05f8210de24dec79f9757037e1285be2a5a5
3
+ size 36700160
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f091b0991ac41259584a7316fe4faae4a7b155bc810b7354a7ca69b86be288a
3
+ size 73400320
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:052fd930e3603e45e910abee6ec5ad612532aec7324195b55831f8923129bee1
3
+ size 36700160
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b732fda78155066addbe226d7a962e853fce9164769658318113e136cf8595ce
3
+ size 73400320
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e4435ea1a606764dc1eb864445a6ec0c7d067d26f884846237f9295dce45290
3
+ size 30494720
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6ffcf42914818ff25e6a5a24150813e1a0d228a7b6f02361c18296750655ca7
3
+ size 36700160
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:788eec42b6947cccfe747981edd85bec7d37865531a3e79feec91d5b5c562edc
3
+ size 73400320
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69dc2780c62b61090c76ab8c93f2927f7de54e7b433d67b4ced4e1d0a36f80d6
3
+ size 30494720
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b948e688e7803163468550561faacc25c93306535c7316a911c3d1cc4f75e0a
3
+ size 36700160
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:faa211970732761b0e242d5ae6bad6a0803418da22cc5512481f6e21c6944137
3
+ size 73400320
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc483edb98da56f5aefcf907a5448d88a601b3116ed75eeefa28ac4a06bab593
3
+ size 30494720
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80b152dcbf109430be053e80c31c2bcf7daa3191a5ffd1c054efe1a3b76fdfb7
3
+ size 36700160
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ef2258af91d105dafc35bf38adf36b8ad1826ac28e98a9df3fc396cc91fe739
3
+ size 30494720
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce65dd5c8b113b2b30e76a8e4e300c0123f0c443de0b0b003a0e1382fc286bb6
3
+ size 73400320
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad037ffa8d6924656e312344183b0d420ff9293b6343b159e73f7b88377677f6
3
+ size 30494720
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d827c5a6931f84ba7ca95ad289d26fc724aad18a1de813b872c651da5be2ae87
3
+ size 36700160
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad11115a410a1185eb377e76c338c054e3df719313037a12de7945c2f9b092ed
3
+ size 73400320
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7737424a2e952198d2fe5c91e06f6c836049b9feff1cc71be5fd35f2679689d6
3
+ size 30494720
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed248b0d7952423a5c4016bae161d7f5db7502a36734cf7d29a2c432bf0bc80c
3
+ size 36700160
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a318f492b7bee129447950b9fe9447c0395f0c8a4e19943f0bea5143e01864c0
3
+ size 73400320
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5131e530aeb9851324560e69b9d79be212ac54d24ef68fef95f8f61b05565dc1
3
+ size 30494720
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7111e7f0f1b5a5429a78ed7c10fd0fac9968e56d7b330f4a405071a7c8bd32c7
3
+ size 36700160
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:568aa5098d890e6850c9b0ed7ede711bad2438e0718e162d2249cd8dcf1bb673
3
+ size 73400320
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7cad449b8068c7d61c647eeadd55f722adb0365a5606121be19ec95dff8e46c
3
+ size 36700160
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c603323ebe0e6af014639ee9b3659914d83b0779a263be51aa045a612ad1d776
3
+ size 30494720
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2859ecf27080e478627cab50b78db1ca4f3918908b61d114952420a6bfcca40
3
+ size 27033600
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57d6844e6ed9acfc424464dd18302b0a44b653692aaa2086ee797365a2334a06
3
+ size 27033600
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6afa59d80288dfb4c18a61221be939d245cee60271c3bc1817463a2d13046bf4
3
+ size 73400320
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68143c2c28787595bd0e1f716ba8bca7f2cd508c373df21da1f7e63875f76ba3
3
+ size 30494720
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:729c5a1d79848dffd9d29531a88a08991877edc18896288dcf2737cee1fa97fa
3
+ size 36700160
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac043e43c896308cd3c65f6c9ea84268571b2942e866ff60cb73bc625dd4c03e
3
+ size 73400320
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d9a0e9ef1cad1fb5b08fef5d83b45a10ae7e437b70f17cec4496389710ceb50
3
+ size 30494720
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcf295e9963d9796234a52101af54cce247074127f5338a6a458b9998782bf7c
3
+ size 36700160
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:104866d8cbe1c863ff6c09e0e7cb1d5fca9d1ba711cfd802d73c22aa58a0224f
3
+ size 73400320
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae2484c5a09d8eb5799684e71d99e97827e6ede847a5c9d93dc7b2b60b690d5d
3
+ size 73400320
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b736c09ec99249ec01abc68353851ab1c6781639b601e43b890684b824b11507
3
+ size 30494720
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c2c83496cad9aaffdc28255771ced19a5fa10ba1f0bbcb01918c8ff1b6a5f09
3
+ size 335544320
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79866085d41f512702c155ff567e3b1c2036c3a835c8718d7b65b9747708af28
3
+ size 36700160
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4d3f3b57ec0c8248001cb14bb3aacce3f9288555db080f9146d5bb25d4308a1
3
+ size 73400320
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd7855dcdbcef1df48b76c8be33872228b53d0478132810c8d29b74e3f0c470f
3
+ size 24770560
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d9fd149e3f4bbc9a999c0eece952d2c72de6e2ae4c93ed70b1660530d49e443
3
+ size 36700160
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef69c922eb44ccbeaef4319db53c057ade07d9b04208abba5241130db64ed904
3
+ size 73400320
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8fc54260bfc8b143549371dd6ed9ce0fac7375523381f093a5d7e102215d8a8
3
+ size 30494720
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ab4906d04156736b0c48f9f57471260c71199f26e8c29e880dd3ca5b126de47
3
+ size 36700160