GGUF
Inference Endpoints
van-qa committed on
Commit
062e706
1 Parent(s): c96f438

Create metadata.yaml

Browse files
Files changed (1) hide show
  1. metadata.yaml +11 -0
metadata.yaml ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: mistral
2
+
3
+ default:
4
+ - main: Mistral-7B-Instruct-v0.3 Q4_K_M
5
+ - gguf: Mistral-7B-Instruct-v0.3 Q4_K_M
6
+ - onnx: Mistral-7B-Instruct-v0.3 AWQ INT4
7
+ - tensorrt-llm: Mistral-7B-Instruct-v0.3 AWQ INT4
8
+ 7b:
9
+ - gguf: Mistral-7B-Instruct-v0.3 Q4_K_M
10
+ - onnx: Mistral-7B-Instruct-v0.3 AWQ INT4
11
+ - tensorrt-llm: Mistral-7B-Instruct-v0.3 AWQ INT4