@@ -28,8 +28,8 @@ def test_llm_judge(row=None):
2828
2929 def fake_create_evaluation (** kwargs ):
3030 captured .update (kwargs )
31- # Simulate API response
32- return {"name" : kwargs .get ("evaluator_id" , "eval" )}
31+ # Simulate API response - returns (result, version_id) tuple
32+ return {"name" : kwargs .get ("evaluator_id" , "eval" )}, "v1"
3333
3434 monkeypatch .setattr (upload_mod , "create_evaluation" , fake_create_evaluation )
3535
@@ -40,7 +40,6 @@ def fake_create_evaluation(**kwargs):
4040 id = None ,
4141 display_name = None ,
4242 description = None ,
43- force = False ,
4443 yes = True ,
4544 )
4645
@@ -72,7 +71,8 @@ def test_llm_judge(row=None):
7271
7372 def fake_create_evaluation (** kwargs ):
7473 captured .update (kwargs )
75- return {"name" : kwargs .get ("evaluator_id" , "eval" )}
74+ # Simulate API response - returns (result, version_id) tuple
75+ return {"name" : kwargs .get ("evaluator_id" , "eval" )}, "v1"
7676
7777 monkeypatch .setattr (upload_mod , "create_evaluation" , fake_create_evaluation )
7878
@@ -83,7 +83,6 @@ def fake_create_evaluation(**kwargs):
8383 id = None ,
8484 display_name = None ,
8585 description = None ,
86- force = False ,
8786 yes = True ,
8887 )
8988
@@ -119,7 +118,8 @@ def test_llm_judge(row=None):
119118
120119 def fake_create_evaluation (** kwargs ):
121120 captured .update (kwargs )
122- return {"name" : kwargs .get ("evaluator_id" , "eval" )}
121+ # Simulate API response - returns (result, version_id) tuple
122+ return {"name" : kwargs .get ("evaluator_id" , "eval" )}, "v1"
123123
124124 monkeypatch .setattr (upload_mod , "create_evaluation" , fake_create_evaluation )
125125
@@ -130,7 +130,6 @@ def fake_create_evaluation(**kwargs):
130130 id = None ,
131131 display_name = None ,
132132 description = None ,
133- force = False ,
134133 yes = True ,
135134 )
136135
@@ -163,8 +162,8 @@ def test_llm_judge(row=None):
163162 monkeypatch .setenv ("FIREWORKS_API_BASE" , "https://dev.api.fireworks.ai" )
164163
165164 def fake_create_evaluation (** kwargs ):
166- # Simulate creation result with evaluator name
167- return {"name" : kwargs .get ("evaluator_id" , "eval" )}
165+ # Simulate creation result with evaluator name - returns (result, version_id) tuple
166+ return {"name" : kwargs .get ("evaluator_id" , "eval" )}, "v1"
168167
169168 monkeypatch .setattr (upload_mod , "create_evaluation" , fake_create_evaluation )
170169
@@ -174,7 +173,6 @@ def fake_create_evaluation(**kwargs):
174173 id = "quickstart-test-llm-judge" ,
175174 display_name = None ,
176175 description = None ,
177- force = True ,
178176 yes = True ,
179177 )
180178
@@ -204,7 +202,8 @@ def test_llm_judge(row=None):
204202 monkeypatch .setenv ("FIREWORKS_API_BASE" , "https://api.fireworks.ai" )
205203
206204 def fake_create_evaluation (** kwargs ):
207- return {"name" : kwargs .get ("evaluator_id" , "eval" )}
205+ # Simulate API response - returns (result, version_id) tuple
206+ return {"name" : kwargs .get ("evaluator_id" , "eval" )}, "v1"
208207
209208 monkeypatch .setattr (upload_mod , "create_evaluation" , fake_create_evaluation )
210209
@@ -214,7 +213,6 @@ def fake_create_evaluation(**kwargs):
214213 id = "quickstart-test-llm-judge" ,
215214 display_name = None ,
216215 description = None ,
217- force = False ,
218216 yes = True ,
219217 )
220218
0 commit comments