From 10ceaa902d53b27d0724983b00a640399eb81325 Mon Sep 17 00:00:00 2001
From: Dev Aggarwal
Date: Wed, 11 Sep 2024 21:15:38 +0530
Subject: [PATCH] Add AfroLlama3 v1 model

---
 daras_ai_v2/language_model.py |  8 ++++++++
 scripts/init_llm_pricing.py   | 12 ++++++++++++
 2 files changed, 20 insertions(+)

diff --git a/daras_ai_v2/language_model.py b/daras_ai_v2/language_model.py
index fbb744d7f..27f9c5786 100644
--- a/daras_ai_v2/language_model.py
+++ b/daras_ai_v2/language_model.py
@@ -329,6 +329,14 @@ class LargeLanguageModels(Enum):
         supports_json=True,
     )
 
+    afrollama_v1 = LLMSpec(
+        label="AfroLlama3 v1 (Jacaranda)",
+        model_id="Jacaranda/AfroLlama_V1",
+        llm_api=LLMApis.self_hosted,
+        context_window=2048,
+        price=1,
+        is_chat_model=False,
+    )
     sea_lion_7b_instruct = LLMSpec(
         label="SEA-LION-7B-Instruct [Deprecated] (aisingapore)",
         model_id="aisingapore/sea-lion-7b-instruct",
diff --git a/scripts/init_llm_pricing.py b/scripts/init_llm_pricing.py
index 18f69f0a4..7632b8bb1 100644
--- a/scripts/init_llm_pricing.py
+++ b/scripts/init_llm_pricing.py
@@ -662,6 +662,18 @@ def run():
         pricing_url="https://docs.anthropic.com/claude/docs/models-overview#model-comparison",
     )
 
+    # AfroLlama3
+
+    llm_pricing_create(
+        model_id="Jacaranda/AfroLlama_V1",
+        model_name=LargeLanguageModels.afrollama_v1.name,
+        unit_cost_input=5,
+        unit_cost_output=15,
+        unit_quantity=10**6,
+        provider=ModelProvider.aks,
+        notes="Same as GPT-4o. Note that the actual cost of this model is in GPU Milliseconds",
+    )
+
     # SEA-LION
 
     llm_pricing_create(