From c758b403b75be4c0d4bed08d45044f81641e0b47 Mon Sep 17 00:00:00 2001
From: Moshe Malawachh
Date: Thu, 16 Jan 2025 12:52:44 +0100
Subject: [PATCH] add bigger context to models and support deepseek too

---
Reviewer notes (free-text area between "---" and the first "diff --git";
it carries no changes of its own):

* models/base.py: reflows the ModelId Literal to one entry per line and adds
  "deepseek-ai/DeepSeek-V3" as a third accepted model id.
* models/models.py: adds a "deepseek-ai/DeepSeek-V3" FullModelConfiguration
  entry (own vm_url, context_length=16384, constructor=HermesModel), inserted
  just before the existing "mistralai/Mistral-Nemo-Instruct-2407" entry.
* NOTE(review): the subject mentions "bigger context", but neither hunk below
  changes an existing context_length value - confirm whether that part of the
  change lives in another commit.
* NOTE(review): the DeepSeek-V3 entry reuses constructor=HermesModel;
  presumably the Hermes prompt format is intended for this endpoint - verify.

 libertai_agents/libertai_agents/models/base.py   | 4 +++-
 libertai_agents/libertai_agents/models/models.py | 5 +++++
 2 files changed, 8 insertions(+), 1 deletion(-)

diff --git a/libertai_agents/libertai_agents/models/base.py b/libertai_agents/libertai_agents/models/base.py
index e88e07a..5362d71 100644
--- a/libertai_agents/libertai_agents/models/base.py
+++ b/libertai_agents/libertai_agents/models/base.py
@@ -10,7 +10,9 @@ from libertai_agents.interfaces.tools import Tool
 
 
 ModelId = Literal[
-    "NousResearch/Hermes-3-Llama-3.1-8B", "mistralai/Mistral-Nemo-Instruct-2407"
+    "NousResearch/Hermes-3-Llama-3.1-8B",
+    "mistralai/Mistral-Nemo-Instruct-2407",
+    "deepseek-ai/DeepSeek-V3",
 ]
 
 
diff --git a/libertai_agents/libertai_agents/models/models.py b/libertai_agents/libertai_agents/models/models.py
index 8c89978..1c0bf48 100644
--- a/libertai_agents/libertai_agents/models/models.py
+++ b/libertai_agents/libertai_agents/models/models.py
@@ -25,6 +25,11 @@ class FullModelConfiguration(ModelConfiguration):
         context_length=16384,
         constructor=HermesModel,
     ),
+    "deepseek-ai/DeepSeek-V3": FullModelConfiguration(
+        vm_url="https://curated.aleph.cloud/vm/9aa80dc7f00c515a5f56b70e65fdab4c367e35f341c3b4220419adb6ca86a33f/completion",
+        context_length=16384,
+        constructor=HermesModel,
+    ),
     "mistralai/Mistral-Nemo-Instruct-2407": FullModelConfiguration(
         vm_url="https://curated.aleph.cloud/vm/2c4ad0bf343fb12924936cbc801732d95ce90f84cd895aa8bee82c0a062815c2/completion",
         context_length=8192,