MLX
mixtral
Mixture of Experts
mzbac committed on
Commit
325b10e
1 Parent(s): 5e7d4bd

Upload folder using huggingface_hub

Browse files
README.md CHANGED
@@ -7,6 +7,7 @@ language:
7
  - en
8
  license: apache-2.0
9
  tags:
 
10
  - mlx
11
  ---
12
 
 
7
  - en
8
  license: apache-2.0
9
  tags:
10
+ - moe
11
  - mlx
12
  ---
13
 
config.json CHANGED
@@ -26,6 +26,7 @@
26
  "tf_legacy_loss": false,
27
  "pruned_heads": {},
28
  "tie_word_embeddings": false,
 
29
  "is_encoder_decoder": false,
30
  "is_decoder": false,
31
  "cross_attention_hidden_size": null,
@@ -48,7 +49,6 @@
48
  "encoder_no_repeat_ngram_size": 0,
49
  "bad_words_ids": null,
50
  "num_return_sequences": 1,
51
- "chunk_size_feed_forward": 0,
52
  "output_scores": false,
53
  "return_dict_in_generate": false,
54
  "forced_bos_token_id": null,
@@ -78,8 +78,8 @@
78
  "decoder_start_token_id": null,
79
  "task_specific_params": null,
80
  "problem_type": null,
81
- "_name_or_path": "/Users/anchenli/.cache/huggingface/hub/models--mistralai--Mixtral-8x7B-v0.1/snapshots/58301445dc1378584211722b7ebf8743ec4e192b",
82
- "transformers_version": "4.37.0.dev0",
83
  "model_type": "mixtral",
84
  "quantization": {
85
  "group_size": 64,
 
26
  "tf_legacy_loss": false,
27
  "pruned_heads": {},
28
  "tie_word_embeddings": false,
29
+ "chunk_size_feed_forward": 0,
30
  "is_encoder_decoder": false,
31
  "is_decoder": false,
32
  "cross_attention_hidden_size": null,
 
49
  "encoder_no_repeat_ngram_size": 0,
50
  "bad_words_ids": null,
51
  "num_return_sequences": 1,
 
52
  "output_scores": false,
53
  "return_dict_in_generate": false,
54
  "forced_bos_token_id": null,
 
78
  "decoder_start_token_id": null,
79
  "task_specific_params": null,
80
  "problem_type": null,
81
+ "_name_or_path": "/Users/anchenli/.cache/huggingface/hub/models--mistralai--Mixtral-8x7B-v0.1/snapshots/985aa055896a8f943d4a9f2572e6ea1341823841",
82
+ "transformers_version": "4.37.1",
83
  "model_type": "mixtral",
84
  "quantization": {
85
  "group_size": 64,
model-00001-of-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7137734d473eae883e8a36945d8c9d76b8b8e8d2ccde5c2fdad98ff07459d539
3
+ size 5349412303
model-00002-of-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a571d33c64bd2d0e224cfd89985bc16c0200138cbefddc8ce6eaa6e8e89f56b0
3
+ size 5360883248
model-00003-of-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd47b28a78e7ad5f49d8a2a2c466bf984f23804b3c4fdab28dcdc76d59fde220
3
+ size 5351529568
model-00004-of-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56252510aa9321a7cae71ea94401f5f3e1045b44a62f057b89f540fc360e3189
3
+ size 5360883534
model-00005-of-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6573a82fca203c5496b818733308ab440181796cb019f582bd73f7c4db2fb23e
3
+ size 5038270293