hf-llm-api

Sleeping

App Files Files Community

jonathanjordan21 committed on Aug 1

Commit

55ab28a

•

1 Parent(s): 6f4d127

Update constants/models.py

Browse files

Files changed (1) hide show

constants/models.py +86 -24

constants/models.py CHANGED Viewed

@@ -9,10 +9,12 @@ MODEL_MAP = {
     "llama3-70b": "meta-llama/Meta-Llama-3-70B-Instruct",
     "zephyr-141b": "HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1",
     "default": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
-    "Qwen2-72B": "Qwen/Qwen2-72B-Instruct",
-    "Qwen2-7B-Instruct": "Qwen/Qwen2-7B-Instruct",
-    "Qwen2-1.5B-Instruct" : "Qwen/Qwen2-1.5B-Instruct",
-    "llama3-8b" : "meta-llama/Meta-Llama-3-8B-Instruct"
 }
 AVAILABLE_MODELS = list(MODEL_MAP.keys())
@@ -36,12 +38,14 @@ STOP_SEQUENCES_MAP = {
     # https://huggingface.co/CohereForAI/c4ai-command-r-plus-4bit/blob/main/tokenizer_config.json#L305
     "command-r-plus": "<|END_OF_TURN_TOKEN|>",
     # https://huggingface.co/Qwen/Qwen2-72B-Instruct/blob/main/tokenizer_config.json#L30
-    "Qwen2-72B": "<|im_end|>",
-    "Qwen2-7B-Instruct": "<|im_end|>",
-    "Qwen2-1.5B-Instruct": "<|im_end|>",
     "llama3-8b" : "<|eot_id|>",
-    "llama3-70b" : "<|eot_id|>"
 }
 TOKEN_LIMIT_MAP = {
@@ -55,23 +59,24 @@ TOKEN_LIMIT_MAP = {
     "llama3-70b": 8192,
     "zephyr-141b": 2048,
     "gpt-3.5-turbo": 8192,
-    "Qwen2-72B": 32768,
-    "Qwen2-7B-Instruct": 32768,
-    "Qwen2-1.5B-Instruct": 32768,
     "llama3-8b": 8192,
 }
 TOKEN_RESERVED = 20
-# https://platform.openai.com/docs/api-reference/models/list
-AVAILABLE_MODELS_DICTS = [
     {
         "id": "mixtral-8x7b",
         "description": "[mistralai/Mixtral-8x7B-Instruct-v0.1]: https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1",
         "object": "model",
         "created": 1700000000,
         "owned_by": "mistralai",
     },
     {
         "id": "nous-mixtral-8x7b",
@@ -79,6 +84,7 @@ AVAILABLE_MODELS_DICTS = [
         "object": "model",
         "created": 1700000000,
         "owned_by": "NousResearch",
     },
     {
         "id": "mistral-7b",
@@ -86,6 +92,7 @@ AVAILABLE_MODELS_DICTS = [
         "object": "model",
         "created": 1700000000,
         "owned_by": "mistralai",
     },
     {
         "id": "yi-1.5-34b",
@@ -93,6 +100,7 @@ AVAILABLE_MODELS_DICTS = [
         "object": "model",
         "created": 1700000000,
         "owned_by": "01-ai",
     },
     {
         "id": "gemma-7b",
@@ -100,63 +108,92 @@ AVAILABLE_MODELS_DICTS = [
         "object": "model",
         "created": 1700000000,
         "owned_by": "Google",
     },
     {
         "id": "openchat-3.5",
         "description": "[openchat/openchat-3.5-0106]: https://huggingface.co/openchat/openchat-3.5-0106",
         "object": "model",
         "created": 1700000000,
-        "owned_by": "openchat"
     },
     {
         "id": "command-r-plus",
         "description": "[CohereForAI/c4ai-command-r-plus]: https://huggingface.co/CohereForAI/c4ai-command-r-plus",
         "object": "model",
         "created": 1700000000,
-        "owned_by": "CohereForAI"
     },
     {
         "id": "llama3-70b",
         "description": "[meta-llama/Meta-Llama-3-70B]: https://huggingface.co/meta-llama/Meta-Llama-3-70B",
         "object": "model",
         "created": 1700000000,
-        "owned_by": "Meta"
     },
     {
         "id": "zephyr-141b",
         "description": "[HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1]: https://huggingface.co/HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1",
         "object": "model",
         "created": 1700000000,
-        "owned_by": "Huggingface"
     },
     {
         "id": "gpt-3.5-turbo",
         "description": "[openai/gpt-3.5-turbo]: https://platform.openai.com/docs/models/gpt-3-5-turbo",
         "object": "model",
         "created": 1700000000,
-        "owned_by": "OpenAI"
     },
     {
-        "id": "Qwen2-72B",
         "description": "[Qwen/Qwen2-72B]: https://huggingface.co/Qwen/Qwen2-72B",
         "object": "model",
         "created": 1700000000,
-        "owned_by": "Qwen"
     },
     {
         "id": "llama3-8b",
         "description": "[meta-llama/Meta-Llama-3-8B]: https://huggingface.co/meta-llama/Meta-Llama-3-8B",
         "object": "model",
         "created": 1700000000,
-        "owned_by": "Meta"
     },
     {
-        "id": "Qwen2-1.5B-Instruct",
         "description": "[Qwen/Qwen2-1.5B-Instruct]: https://huggingface.co/Qwen/Qwen2-1.5B-Instruct",
         "object": "model",
         "created": 1700000000,
-        "owned_by": "Qwen"
     },
     {
         "id": "nomic-text-embed",
         "description": "[nomic-ai/nomic-embed-text-v1.5]: https://huggingface.co/nomic-ai/nomic-embed-text-v1.5",
@@ -171,4 +208,29 @@ AVAILABLE_MODELS_DICTS = [
         "created": 1700000000,
         "owned_by": "mixedbread-ai"
     },
 ]

     "llama3-70b": "meta-llama/Meta-Llama-3-70B-Instruct",
     "zephyr-141b": "HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1",
     "default": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
+    "qwen2-72b": "Qwen/Qwen2-72B-Instruct",
+    "qwen2-7b-instruct": "Qwen/Qwen2-7B-Instruct",
+    "qwen2-1.5b-instruct" : "Qwen/Qwen2-1.5B-Instruct",
+    "llama3-8b" : "meta-llama/Meta-Llama-3-8B-Instruct",
+    "mistral-nemo-instruct":"mistralai/Mistral-Nemo-Instruct-2407",
+    "zephyr-7b-beta":"HuggingFaceH4/zephyr-7b-beta"
 }
 AVAILABLE_MODELS = list(MODEL_MAP.keys())
     # https://huggingface.co/CohereForAI/c4ai-command-r-plus-4bit/blob/main/tokenizer_config.json#L305
     "command-r-plus": "<|END_OF_TURN_TOKEN|>",
     # https://huggingface.co/Qwen/Qwen2-72B-Instruct/blob/main/tokenizer_config.json#L30
+    "qwen2-72b": "<|im_end|>",
+    "qwen2-7b-instruct": "<|im_end|>",
+    "qwen2-1.5b-instruct": "<|im_end|>",
     "llama3-8b" : "<|eot_id|>",
+    "llama3-70b" : "<|eot_id|>",
+    "mistral-nemo-instruct": "</s>",
+    "zephyr-7b-beta":"</s>"
 }
 TOKEN_LIMIT_MAP = {
     "llama3-70b": 8192,
     "zephyr-141b": 2048,
     "gpt-3.5-turbo": 8192,
+    "qwen2-72b": 32768,
+    "qwen2-7b-instruct": 32768,
+    "qwen2-1.5b-instruct": 32768,
     "llama3-8b": 8192,
+    "mistral-nemo-instruct":128000,
+    "zephyr-7b-beta":32768,
 }
 TOKEN_RESERVED = 20
+LLM_MODELS_DICTS = [
     {
         "id": "mixtral-8x7b",
         "description": "[mistralai/Mixtral-8x7B-Instruct-v0.1]: https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1",
         "object": "model",
         "created": 1700000000,
         "owned_by": "mistralai",
+        "type": "basic",
     },
     {
         "id": "nous-mixtral-8x7b",
         "object": "model",
         "created": 1700000000,
         "owned_by": "NousResearch",
+        "type": "basic",
     },
     {
         "id": "mistral-7b",
         "object": "model",
         "created": 1700000000,
         "owned_by": "mistralai",
+        "type": "basic",
     },
     {
         "id": "yi-1.5-34b",
         "object": "model",
         "created": 1700000000,
         "owned_by": "01-ai",
+        "type": "pro",
     },
     {
         "id": "gemma-7b",
         "object": "model",
         "created": 1700000000,
         "owned_by": "Google",
+        "type": "basic",
     },
     {
         "id": "openchat-3.5",
         "description": "[openchat/openchat-3.5-0106]: https://huggingface.co/openchat/openchat-3.5-0106",
         "object": "model",
         "created": 1700000000,
+        "owned_by": "openchat",
+        "type": "basic",
     },
     {
         "id": "command-r-plus",
         "description": "[CohereForAI/c4ai-command-r-plus]: https://huggingface.co/CohereForAI/c4ai-command-r-plus",
         "object": "model",
         "created": 1700000000,
+        "owned_by": "CohereForAI",
+        "type": "pro",
     },
     {
         "id": "llama3-70b",
         "description": "[meta-llama/Meta-Llama-3-70B]: https://huggingface.co/meta-llama/Meta-Llama-3-70B",
         "object": "model",
         "created": 1700000000,
+        "owned_by": "Meta",
+        "type": "pro",
     },
     {
         "id": "zephyr-141b",
         "description": "[HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1]: https://huggingface.co/HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1",
         "object": "model",
         "created": 1700000000,
+        "owned_by": "Huggingface",
+        "type": "pro",
     },
     {
         "id": "gpt-3.5-turbo",
         "description": "[openai/gpt-3.5-turbo]: https://platform.openai.com/docs/models/gpt-3-5-turbo",
         "object": "model",
         "created": 1700000000,
+        "owned_by": "OpenAI",
+        "type": "subscription",
     },
     {
+        "id": "qwen2-72b",
         "description": "[Qwen/Qwen2-72B]: https://huggingface.co/Qwen/Qwen2-72B",
         "object": "model",
         "created": 1700000000,
+        "owned_by": "Qwen",
+        "type": "pro",
     },
     {
         "id": "llama3-8b",
         "description": "[meta-llama/Meta-Llama-3-8B]: https://huggingface.co/meta-llama/Meta-Llama-3-8B",
         "object": "model",
         "created": 1700000000,
+        "owned_by": "Meta",
+        "type": "basic",
     },
     {
+        "id": "qwen2-1.5b-instruct",
         "description": "[Qwen/Qwen2-1.5B-Instruct]: https://huggingface.co/Qwen/Qwen2-1.5B-Instruct",
         "object": "model",
         "created": 1700000000,
+        "owned_by": "Qwen",
+        "type": "basic",
+    },
+    {
+        "id": "mistral-nemo-instruct",
+        "description": "[mistralai/Mistral-Nemo-Instruct-2407]: https://huggingface.co/mistralai/Mistral-Nemo-Instruct-2407",
+        "object": "model",
+        "created": 1700000000,
+        "owned_by": "mistralai",
+        "type": "basic",
+    },
+    {
+        "id": "zephyr-7b-beta",
+        "description": "[HuggingFaceH4/zephyr-7b-beta]: https://huggingface.co/HuggingFaceH4/zephyr-7b-beta",
+        "object": "model",
+        "created": 1700000000,
+        "owned_by": "HuggingFaceH4",
+        "type": "basic",
     },
+]
+EMBEDDINGS_MODELS_DICTS = [
     {
         "id": "nomic-text-embed",
         "description": "[nomic-ai/nomic-embed-text-v1.5]: https://huggingface.co/nomic-ai/nomic-embed-text-v1.5",
         "created": 1700000000,
         "owned_by": "mixedbread-ai"
     },
+    {
+        "id": "mixbread-ai/mxbai-embed-large-v1",
+        "description": "[mixedbread-ai/mxbai-embed-large-v1]: https://huggingface.co/mixedbread-ai/mxbai-embed-large-v1",
+        "object": "embeddings",
+        "created": 1700000000,
+        "owned_by": "mixedbread-ai"
+    },
+    {
+        "id": "multilingual-e5-large-instruct",
+        "description": "[intfloat/multilingual-e5-large-instruct]: https://huggingface.co/intfloat/multilingual-e5-large-instruct",
+        "object": "embeddings",
+        "created": 1700000000,
+        "owned_by": "intfloat"
+    },
+    {
+        "id": "intfloat/multilingual-e5-large-instruct",
+        "description": "[intfloat/multilingual-e5-large-instruct]: https://huggingface.co/intfloat/multilingual-e5-large-instruct",
+        "object": "embeddings",
+        "created": 1700000000,
+        "owned_by": "intfloat"
+    },
 ]
+# https://platform.openai.com/docs/api-reference/models/list
+AVAILABLE_MODELS_DICTS = LLM_MODELS_DICTS + EMBEDDINGS_MODELS_DICTS