HFLLMAPI

Sleeping

App Files Files Community

Husnain commited on Apr 20, 2024

Commit

56aa981

unverified ·

1 Parent(s): 827c283

⚡ [Enhance] Use nous-mixtral-8x7b as default model

Browse files

Files changed (1) hide show

constants/models.py +29 -11

constants/models.py CHANGED Viewed

@@ -6,16 +6,19 @@ MODEL_MAP = {
     "gemma-7b": "google/gemma-1.1-7b-it",
     "command-r-plus": "CohereForAI/c4ai-command-r-plus",
     "llama3-70b": "meta-llama/Meta-Llama-3-70B-Instruct",
-    "default": "mistralai/Mixtral-8x7B-Instruct-v0.1",
 }
 AVAILABLE_MODELS = list(MODEL_MAP.keys())
 STOP_SEQUENCES_MAP = {
     "mixtral-8x7b": "</s>",
     "nous-mixtral-8x7b": "<|im_end|>",
     "mistral-7b": "</s>",
-    "openchat-3.5": "<|end_of_turn|>",
     "gemma-7b": "<eos>",
     "command-r-plus": "<|END_OF_TURN_TOKEN|>",
 }
@@ -24,11 +27,12 @@ TOKEN_LIMIT_MAP = {
     "mixtral-8x7b": 32768,
     "nous-mixtral-8x7b": 32768,
     "mistral-7b": 32768,
-    "openchat-3.5": 8192,
     "gemma-7b": 8192,
-    "gpt-3.5-turbo": 8192,
     "command-r-plus": 32768,
     "llama3-70b": 8192,
 }
 TOKEN_RESERVED = 20
@@ -71,13 +75,27 @@ AVAILABLE_MODELS_DICTS = [
         "created": 1700000000,
         "owned_by": "Google",
     },
-    # {
-    #     "id": "command-r-plus",
-    #     "description": "[CohereForAI/c4ai-command-r-plus]: https://huggingface.co/CohereForAI/c4ai-command-r-plus",
-    #     "object": "model",
-    #     "created": 1700000000,
-    #     "owned_by": "CohereForAI",
-    # },
     {
         "id": "gpt-3.5-turbo",
         "description": "[openai/gpt-3.5-turbo]: https://platform.openai.com/docs/models/gpt-3-5-turbo",

     "gemma-7b": "google/gemma-1.1-7b-it",
     "command-r-plus": "CohereForAI/c4ai-command-r-plus",
     "llama3-70b": "meta-llama/Meta-Llama-3-70B-Instruct",
+    "zephyr-141b": "HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1",
+    "default": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
 }
 AVAILABLE_MODELS = list(MODEL_MAP.keys())
+PRO_MODELS = ["command-r-plus", "llama3-70b", "zephyr-141b"]
 STOP_SEQUENCES_MAP = {
     "mixtral-8x7b": "</s>",
     "nous-mixtral-8x7b": "<|im_end|>",
     "mistral-7b": "</s>",
+    # "openchat-3.5": "<|end_of_turn|>",
     "gemma-7b": "<eos>",
     "command-r-plus": "<|END_OF_TURN_TOKEN|>",
 }
     "mixtral-8x7b": 32768,
     "nous-mixtral-8x7b": 32768,
     "mistral-7b": 32768,
+    # "openchat-3.5": 8192,
     "gemma-7b": 8192,
     "command-r-plus": 32768,
     "llama3-70b": 8192,
+    "zephyr-141b": 2048,
+    "gpt-3.5-turbo": 8192,
 }
 TOKEN_RESERVED = 20
         "created": 1700000000,
         "owned_by": "Google",
     },
+    {
+        "id": "command-r-plus",
+        "description": "[CohereForAI/c4ai-command-r-plus]: https://huggingface.co/CohereForAI/c4ai-command-r-plus",
+        "object": "model",
+        "created": 1700000000,
+        "owned_by": "CohereForAI",
+    },
+    {
+        "id": "llama3-70b",
+        "description": "[meta-llama/Meta-Llama-3-70B]: https://huggingface.co/meta-llama/Meta-Llama-3-70B",
+        "object": "model",
+        "created": 1700000000,
+        "owned_by": "Meta",
+    },
+    {
+        "id": "zephyr-141b",
+        "description": "[HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1]: https://huggingface.co/HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1",
+        "object": "model",
+        "created": 1700000000,
+        "owned_by": "Huggingface",
+    },
     {
         "id": "gpt-3.5-turbo",
         "description": "[openai/gpt-3.5-turbo]: https://platform.openai.com/docs/models/gpt-3-5-turbo",