@@ -248,6 +248,18 @@ def __init__(self, model: str, display_model: Optional[str] = None):
248
248
)
249
249
250
250
251
class _CerebrasLlm(_Llm):
    """`_Llm` preconfigured for the Cerebras endpoint at https://api.cerebras.ai/v1.

    Model list:
    https://docs.cerebras.ai/en/latest/wsc/Model-zoo/MZ-overview.html#list-of-models
    """

    def __init__(self, model: str, display_model: Optional[str] = None):
        """Forward the Cerebras connection settings to the `_Llm` initializer.

        Args:
            model: Model identifier, passed through unchanged as the first
                positional argument.
            display_model: Optional alternative name used in the
                "api.cerebras.ai/..." label; when falsy, `model` is used.
        """
        # Prefer the caller-supplied name; fall back to the raw model id.
        shown_name = display_model or model
        label = "api.cerebras.ai/" + shown_name
        super().__init__(
            model,
            label,
            # os.getenv yields None when CEREBRAS_API_KEY is not set.
            api_key=os.getenv("CEREBRAS_API_KEY"),
            base_url="https://api.cerebras.ai/v1",
        )
261
+
262
+
251
263
def _text_models ():
252
264
AZURE_EASTUS2_OPENAI_API_KEY = os .getenv ("AZURE_EASTUS2_OPENAI_API_KEY" )
253
265
return [
@@ -358,6 +370,7 @@ def _text_models():
358
370
_TogetherLlm (
359
371
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo" , LLAMA_31_70B_CHAT_FP8
360
372
),
373
+ _CerebrasLlm ("llama3.1-70b" , LLAMA_31_70B_CHAT ),
361
374
# _OvhLlm("llama-3p1-8b-instruct", LLAMA_31_8B_CHAT),
362
375
# Llama 3.1 8b
363
376
# _DatabricksLlm("databricks-meta-llama-3.1-8b-instruct", LLAMA_31_8B_CHAT),
@@ -371,6 +384,7 @@ def _text_models():
371
384
_TogetherLlm (
372
385
"meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo" , LLAMA_31_8B_CHAT_FP8
373
386
),
387
+ _CerebrasLlm ("llama3.1-8b" , LLAMA_31_8B_CHAT ),
374
388
# _OvhLlm("llama-3p1-70b-instruct", LLAMA_31_70B_CHAT),
375
389
# Llama 3 70b
376
390
_DatabricksLlm ("databricks-meta-llama-3-70b-instruct" , LLAMA_3_70B_CHAT ),
0 commit comments