@@ -124,6 +124,18 @@ async def run(self, pass_argv: List[str], spread: float) -> asyncio.Task:
124
124
return await llm_benchmark .run (full_argv )
125
125
126
126
127
class _CerebrasLlm(_Llm):
    """`_Llm` preset that targets the Cerebras API.

    Model list:
    https://docs.cerebras.ai/en/latest/wsc/Model-zoo/MZ-overview.html#list-of-models

    Args:
        model: Model identifier, forwarded unchanged to `_Llm.__init__`.
        display_model: Optional name used in place of `model` when building
            the "cerebras.ai/..." label.
    """

    def __init__(self, model: str, display_model: Optional[str] = None):
        # Use the raw model id in the label when no display name is supplied.
        shown_name = display_model if display_model else model
        label = "cerebras.ai/" + shown_name
        # os.getenv yields None when CEREBRAS_API_KEY is not set.
        key = os.getenv("CEREBRAS_API_KEY")
        super().__init__(
            model,
            label,
            api_key=key,
            base_url="https://api.cerebras.ai/v1",
        )
137
+
138
+
127
139
class _CloudflareLlm (_Llm ):
128
140
"""See https://developers.cloudflare.com/workers-ai/models/"""
129
141
@@ -224,6 +236,17 @@ def __init__(
224
236
)
225
237
226
238
239
class _OvhLlm(_Llm):
    """`_Llm` preset for OVHcloud AI Endpoints.

    See https://llama-3-70b-instruct.endpoints.kepler.ai.cloud.ovh.net/doc

    Args:
        model: Endpoint name; it becomes the subdomain of the base URL
            (``https://<model>.endpoints.kepler.ai.cloud.ovh.net/...``).
        display_model: Optional name used in place of `model` when building
            the "cloud.ovh.net/..." label.
    """

    def __init__(self, model: str, display_model: Optional[str] = None):
        super().__init__(
            # The model argument is deliberately left empty; the model is
            # selected through the host name in base_url instead.
            # NOTE(review): presumably each endpoint serves one model - confirm.
            "",
            # Fall back to `model` so the default display_model=None does not
            # raise TypeError on string concatenation.
            "cloud.ovh.net/" + (display_model or model),
            base_url=f"https://{model}.endpoints.kepler.ai.cloud.ovh.net/api/openai_compat/v1",
        )
248
+
249
+
227
250
class _PerplexityLlm (_Llm ):
228
251
"""See https://docs.perplexity.ai/docs/model-cards"""
229
252
@@ -248,26 +271,15 @@ def __init__(self, model: str, display_model: Optional[str] = None):
248
271
)
249
272
250
273
251
class _OvhLlm(_Llm):
    """`_Llm` preset for OVHcloud AI Endpoints.

    See https://llama-3-70b-instruct.endpoints.kepler.ai.cloud.ovh.net/doc

    Args:
        model: Endpoint name; it becomes the subdomain of the base URL
            (``https://<model>.endpoints.kepler.ai.cloud.ovh.net/...``).
        display_model: Optional name used in place of `model` when building
            the "cloud.ovh.net/..." label.
    """

    def __init__(self, model: str, display_model: Optional[str] = None):
        super().__init__(
            # The model argument is deliberately left empty; the model is
            # selected through the host name in base_url instead.
            # NOTE(review): presumably each endpoint serves one model - confirm.
            "",
            # Fall back to `model` so the default display_model=None does not
            # raise TypeError on string concatenation.
            "cloud.ovh.net/" + (display_model or model),
            base_url=f"https://{model}.endpoints.kepler.ai.cloud.ovh.net/api/openai_compat/v1",
        )
260
-
261
-
262
- class _CerebrasLlm (_Llm ):
263
- """See https://docs.cerebras.ai/en/latest/wsc/Model-zoo/MZ-overview.html#list-of-models"""
274
class _UltravoxLlm(_Llm):
    """`_Llm` preset for the hosted Ultravox API.

    See https://docs.ultravox.ai/docs/models

    Args:
        model: Model identifier, forwarded unchanged to `_Llm.__init__`.
        display_model: Optional name used in place of `model` when building
            the "ultravox.ai/..." label.
    """

    def __init__(self, model: str, display_model: Optional[str] = None):
        super().__init__(
            model,
            # Use the raw model id in the label when no display name is given.
            "ultravox.ai/" + (display_model or model),
            # os.getenv yields None when ULTRAVOX_API_KEY is not set.
            api_key=os.getenv("ULTRAVOX_API_KEY"),
            base_url="https://ultravox.api.fixie.ai/v1",
        )
272
284
273
285
@@ -509,11 +521,8 @@ def _audio_models():
509
521
# _Llm(GPT_4O), doesn't support audio yet
510
522
_Llm (GEMINI_1_5_PRO ),
511
523
_Llm (GEMINI_1_5_FLASH ),
512
- _Llm (
513
- "fixie-ai/ultravox-v0.4" ,
514
- base_url = "https://ultravox.api.fixie.ai/v1" ,
515
- api_key = os .getenv ("ULTRAVOX_API_KEY" ),
516
- ),
524
+ _UltravoxLlm ("fixie-ai/ultravox-v0.4" , "ultravox-v0.4-8b" ),
525
+ _UltravoxLlm ("fixie-ai/ultravox-70B" , "ultravox-v0.4-70b" ),
517
526
_Llm (
518
527
"fixie-ai/ultravox-v0.2" ,
519
528
"baseten.co/ultravox-v0.2" ,
0 commit comments