File tree: 2 files changed, +13 -9 lines changed
lines changed Original file line number Diff line number Diff line change @@ -39,6 +39,7 @@ import { google } from "@ai-sdk/google";
39
39
import { anthropic } from "@ai-sdk/anthropic" ;
40
40
import { groq } from "@ai-sdk/groq" ;
41
41
import { cerebras } from "@ai-sdk/cerebras" ;
42
+ import { openai } from "@ai-sdk/openai" ;
42
43
dotenv . config ( ) ;
43
44
44
45
/**
@@ -274,14 +275,12 @@ const generateFilteredTestcases = (): Testcase[] => {
274
275
275
276
// Execute the task
276
277
let llmClient : LLMClient ;
277
- if ( input . modelName . startsWith ( "gpt" ) ) {
278
- llmClient = new CustomOpenAIClient ( {
279
- modelName : input . modelName as AvailableModel ,
280
- client : wrapOpenAI (
281
- new OpenAI ( {
282
- apiKey : process . env . OPENAI_API_KEY ,
283
- } ) ,
284
- ) ,
278
+ if (
279
+ input . modelName . startsWith ( "gpt" ) ||
280
+ input . modelName . startsWith ( "o" )
281
+ ) {
282
+ llmClient = new AISdkClient ( {
283
+ model : wrapAISDKModel ( openai ( input . modelName ) ) ,
285
284
} ) ;
286
285
} else if ( input . modelName . startsWith ( "gemini" ) ) {
287
286
llmClient = new AISdkClient ( {
Original file line number Diff line number Diff line change @@ -23,13 +23,18 @@ const ALL_EVAL_MODELS = [
23
23
"gemini-2.5-pro-exp-03-25" ,
24
24
"gemini-1.5-pro" ,
25
25
"gemini-1.5-flash-8b" ,
26
+ "gemini-2.5-flash-preview-04-17" ,
27
+ "gemini-2.5-pro-preview-03-25" ,
26
28
// ANTHROPIC
27
29
"claude-3-5-sonnet-latest" ,
28
30
"claude-3-7-sonnet-latest" ,
29
31
// OPENAI
30
32
"gpt-4o-mini" ,
31
33
"gpt-4o" ,
32
34
"gpt-4.5-preview" ,
35
+ "o3" ,
36
+ "o3-mini" ,
37
+ "o4-mini" ,
33
38
// TOGETHER - META
34
39
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo" ,
35
40
"meta-llama/Llama-3.3-70B-Instruct-Turbo" ,
@@ -95,7 +100,7 @@ if (filterByEvalName && !tasksByName[filterByEvalName]) {
95
100
*/
96
101
const DEFAULT_EVAL_MODELS = process . env . EVAL_MODELS
97
102
? process . env . EVAL_MODELS . split ( "," )
98
- : [ "claude-3-5-sonnet-latest" , "gpt-4o-mini ", "gpt-4o " ] ;
103
+ : [ "gemini-2.5-pro-preview-03-25 " , "o3 " ] ;
99
104
100
105
/**
101
106
* getModelList:
You can’t perform that action at this time.
0 commit comments