Spaces:

karim23657
/

llm-api-hf

Sleeping

App Files Files Community

karim23657 committed on Apr 9

Commit

307fd9d

verified ·

1 Parent(s): 0c5bfb2

Update constants/models.py

Browse files

Files changed (1) hide show

constants/models.py +11 -0

constants/models.py CHANGED Viewed

@@ -12,6 +12,7 @@ MODEL_MAP = {
   "Hermes-3-Llama-3.1-8B": "NousResearch/Hermes-3-Llama-3.1-8B",
   "Mistral-Nemo-Instruct-2407": "mistralai/Mistral-Nemo-Instruct-2407",
   "Phi-3.5-mini-instruct": "microsoft/Phi-3.5-mini-instruct",
     "nous-mixtral-8x7b": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
     "mistral-7b": "mistralai/Mistral-7B-Instruct-v0.2",
     "yi-1.5-34b": "01-ai/Yi-1.5-34B-Chat",
@@ -53,6 +54,7 @@ STOP_SEQUENCES_MAP = {
     "Qwen2.5-72B-Instruct":"<|im_end|>",
     # https://huggingface.co/unsloth/DeepSeek-R1-Distill-Qwen-32B/blob/main/tokenizer_config.json
     "DeepSeek-R1-Distill-Qwen-32B":"<｜end▁of▁sentence｜>",
     # "openchat-3.5": "<|end_of_turn|>",
     # "command-r-plus": "<|END_OF_TURN_TOKEN|>",
@@ -68,6 +70,7 @@ TOKEN_LIMIT_MAP = {
     "c4ai-command-r-plus-08-2024":1000000000000000019884624838656,
     "Qwen2.5-72B-Instruct":131072,
     "DeepSeek-R1-Distill-Qwen-32B":131072,
     # "openchat-3.5": 8192,
     # "command-r-plus": 32768,
@@ -109,6 +112,14 @@ AVAILABLE_MODELS_DICTS = [
     "created": 1700000000,
     "owned_by": "deepseek-ai"
   },
   {
     "id": "Llama-3.1-Nemotron-70B-Instruct-HF",
     "description": "[nvidia/Llama-3.1-Nemotron-70B-Instruct-HF]: https://huggingface.co/nvidia/Llama-3.1-Nemotron-70B-Instruct-HF",

   "Hermes-3-Llama-3.1-8B": "NousResearch/Hermes-3-Llama-3.1-8B",
   "Mistral-Nemo-Instruct-2407": "mistralai/Mistral-Nemo-Instruct-2407",
   "Phi-3.5-mini-instruct": "microsoft/Phi-3.5-mini-instruct",
+  "DeepSeek-V3-0324": "deepseek-ai/DeepSeek-V3-0324",
     "nous-mixtral-8x7b": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
     "mistral-7b": "mistralai/Mistral-7B-Instruct-v0.2",
     "yi-1.5-34b": "01-ai/Yi-1.5-34B-Chat",
     "Qwen2.5-72B-Instruct":"<|im_end|>",
     # https://huggingface.co/unsloth/DeepSeek-R1-Distill-Qwen-32B/blob/main/tokenizer_config.json
     "DeepSeek-R1-Distill-Qwen-32B":"<｜end▁of▁sentence｜>",
+    "DeepSeek-V3-0324":"<｜end▁of▁sentence｜>",
     # "openchat-3.5": "<|end_of_turn|>",
     # "command-r-plus": "<|END_OF_TURN_TOKEN|>",
     "c4ai-command-r-plus-08-2024":1000000000000000019884624838656,
     "Qwen2.5-72B-Instruct":131072,
     "DeepSeek-R1-Distill-Qwen-32B":131072,
+    "DeepSeek-R1-Distill-Qwen-32B":131072,
     # "openchat-3.5": 8192,
     # "command-r-plus": 32768,
     "created": 1700000000,
     "owned_by": "deepseek-ai"
   },
+  },
+  {
+    "id": "DeepSeek-V3-0324",
+    "description": "[deepseek-ai/DeepSeek-V3-0324]: https://huggingface.co/deepseek-ai/DeepSeek-V3-0324",
+    "object": "model",
+    "created": 1700000000,
+    "owned_by": "deepseek-ai"
+  },
   {
     "id": "Llama-3.1-Nemotron-70B-Instruct-HF",
     "description": "[nvidia/Llama-3.1-Nemotron-70B-Instruct-HF]: https://huggingface.co/nvidia/Llama-3.1-Nemotron-70B-Instruct-HF",