@@ -225,7 +225,8 @@ class _OvhLlm(_Llm):
225
225
def __init__ (self , model : str , display_model : Optional [str ] = None ):
226
226
super ().__init__ (
227
227
"" ,
228
- "cloud.ovh.net/" + display_model ,
228
+ f"endpoints.ai.cloud.ovh.net/{ model } " ,
229
+ api_key = os .getenv ("OVH_AI_ENDPOINTS_API_KEY" ),
229
230
base_url = f"https://{ model } .endpoints.kepler.ai.cloud.ovh.net/api/openai_compat/v1" ,
230
231
)
231
232
@@ -352,6 +353,7 @@ def _text_models():
352
353
_GroqLlm ("mixtral-8x7b-32768" , MIXTRAL_8X7B_INSTRUCT_FP8 ),
353
354
_NvidiaLlm ("mistralai/mixtral-8x7b-instruct-v0.1-turbo" , MIXTRAL_8X7B_INSTRUCT_FP8 ),
354
355
_TogetherLlm ("mistralai/Mixtral-8x7B-Instruct-v0.1" , MIXTRAL_8X7B_INSTRUCT ),
356
+ _OvhLlm ("mixtral-8x7b-instruct-v01" , MIXTRAL_8X7B_INSTRUCT ),
355
357
# Llama 3.1 405b
356
358
_DatabricksLlm ("databricks-meta-llama-3.1-405b-instruct" , LLAMA_31_405B_CHAT ),
357
359
_DeepInfraLlm (
@@ -365,7 +367,7 @@ def _text_models():
365
367
_TogetherLlm (
366
368
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo" , LLAMA_31_405B_CHAT_FP8
367
369
),
368
- # _OvhLlm("llama-3p1 -405b-instruct", LLAMA_31_405B_CHAT),
370
+ # _OvhLlm("llama-3-1 -405b-instruct", LLAMA_31_405B_CHAT),
369
371
# Llama 3.1 70b
370
372
_CerebrasLlm ("llama3.1-70b" , LLAMA_31_70B_CHAT ),
371
373
_CloudflareLlm ("@cf/meta/llama-3.1-70b-preview" , LLAMA_31_70B_CHAT ),
@@ -380,7 +382,7 @@ def _text_models():
380
382
_TogetherLlm (
381
383
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo" , LLAMA_31_70B_CHAT_FP8
382
384
),
383
- # _OvhLlm("llama-3p1-8b- instruct", LLAMA_31_8B_CHAT ),
385
+ _OvhLlm ("llama-3-1-70b- instruct" , LLAMA_31_70B_CHAT ),
384
386
# Llama 3.1 8b
385
387
_CerebrasLlm ("llama3.1-8b" , LLAMA_31_8B_CHAT ),
386
388
_CloudflareLlm ("@cf/meta/llama-3.1-8b-preview" , LLAMA_31_8B_CHAT ),
@@ -395,7 +397,7 @@ def _text_models():
395
397
_TogetherLlm (
396
398
"meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo" , LLAMA_31_8B_CHAT_FP8
397
399
),
398
- # _OvhLlm("llama-3p1-70b- instruct", LLAMA_31_70B_CHAT ),
400
+ # _OvhLlm("llama-3-1-8b- instruct", LLAMA_31_8B_CHAT ),
399
401
# Llama 3 70b
400
402
_DatabricksLlm ("databricks-meta-llama-3-70b-instruct" , LLAMA_3_70B_CHAT ),
401
403
_DeepInfraLlm ("meta-llama/Meta-Llama-3-70B-Instruct" , LLAMA_3_70B_CHAT ),
0 commit comments