@@ -168,6 +168,7 @@ async def test_evaluate_success_with_valid_response(
168168
169169 assert isinstance (result , JudgeResult )
170170 assert result .success is True
171+ assert result .sampled is True
171172 assert result .metric_key == '$ld:ai:judge:relevance'
172173 assert result .score == 0.85
173174 assert result .reasoning is not None
@@ -194,6 +195,7 @@ async def test_evaluate_success_with_evaluation_response_shape(
194195
195196 assert isinstance (result , JudgeResult )
196197 assert result .success is True
198+ assert result .sampled is True
197199 assert result .metric_key == '$ld:ai:judge:relevance'
198200 assert result .score == 0.9
199201 assert result .reasoning is not None
@@ -288,13 +290,13 @@ async def test_evaluate_handles_exception(
288290 async def test_evaluate_respects_sampling_rate (
289291 self , judge_config_with_key : AIJudgeConfig , tracker : LDAIConfigTracker , mock_runner
290292 ):
291- """Evaluate should return sampled=True when skipped due to sampling rate."""
293+ """Evaluate should return sampled=False when skipped due to sampling rate."""
292294 judge = Judge (judge_config_with_key , tracker , mock_runner )
293295
294296 result = await judge .evaluate ("input" , "output" , sampling_rate = 0.0 )
295297
296298 assert isinstance (result , JudgeResult )
297- assert result .sampled is True
299+ assert result .sampled is False
298300 assert result .success is False
299301 mock_runner .invoke_structured_model .assert_not_called ()
300302
0 commit comments