We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 3daa122 commit ab47c30 Copy full SHA for ab47c30
1 file changed
tests/unit/rl_utils_test.py
@@ -180,10 +180,11 @@ def test_score_duplicate_reasoning_start_tag(self):
180
@pytest.mark.cpu_only
181
def test_score_multiple_completions(self):
182
# Multiple completions at once -> one score per entry
183
- scores = self._score([
+ multi_completions = [
184
"<reasoning>think</reasoning><answer>42</answer>", # 2.0
185
"no tags here", # -2.0
186
- ])
+ ]
187
+ scores = self._score(multi_completions)
188
self.assertEqual(len(scores), 2)
189
self.assertEqual(scores[0], 2.0)
190
self.assertEqual(scores[1], -2.0)
0 commit comments