@@ -38,6 +38,7 @@ def _make_config():
3838 reasoning_end_token = "</reasoning>" ,
3939 solution_start_token = "<answer>" ,
4040 solution_end_token = "</answer>" ,
41+ reward_exact_answer = 3.0 ,
4142 reward_exact_format_match = 2.0 ,
4243 reward_partial_format_match = 0.5 ,
4344 reward_white_space_format_match = 1.5 ,
@@ -223,7 +224,7 @@ def test_extraction_succeeds_full_format(self):
223224 completions = ["<reasoning>40 + 2 = 42</reasoning><answer>42</answer>" ],
224225 answer = ["42" ],
225226 )
226- self .assertEqual (scores [0 ], 1.5 )
227+ self .assertEqual (scores [0 ], self . config . reward_exact_answer )
227228
228229 @pytest .mark .cpu_only
229230 def test_extraction_fails_no_tags (self ):
@@ -241,7 +242,7 @@ def test_extraction_fails_answer_tags_only(self):
241242 completions = ["<answer>42</answer>" ],
242243 answer = ["42" ],
243244 )
244- self .assertEqual (scores [0 ], 1.5 )
245+ self .assertEqual (scores [0 ], self . config . reward_exact_answer )
245246
246247 @pytest .mark .cpu_only
247248 def test_extraction_fails_reasoning_tags_only (self ):
@@ -262,7 +263,7 @@ def test_extraction_batch_mixed(self):
262263 ],
263264 answer = ["7" , "7" ],
264265 )
265- self .assertEqual (scores [0 ], 1.5 )
266+ self .assertEqual (scores [0 ], self . config . reward_exact_answer )
266267 self .assertEqual (scores [1 ], 0 )
267268
268269 # ---------------------------------------------------------------
@@ -276,7 +277,7 @@ def test_extracted_matches_integer_answer(self):
276277 completions = ["<reasoning>simple</reasoning><answer>100</answer>" ],
277278 answer = ["100" ],
278279 )
279- self .assertEqual (scores [0 ], 1.5 )
280+ self .assertEqual (scores [0 ], self . config . reward_exact_answer )
280281
281282 @pytest .mark .cpu_only
282283 def test_extracted_does_not_match_answer (self ):
@@ -294,7 +295,7 @@ def test_extracted_matches_comma_formatted_number(self):
294295 completions = ["<reasoning>cost calculation</reasoning><answer>1,000</answer>" ],
295296 answer = ["1000" ],
296297 )
297- self .assertEqual (scores [0 ], 1.5 )
298+ self .assertEqual (scores [0 ], self . config . reward_exact_answer )
298299
299300 @pytest .mark .cpu_only
300301 def test_extracted_matches_with_currency_prefix (self ):
@@ -303,7 +304,7 @@ def test_extracted_matches_with_currency_prefix(self):
303304 completions = ["<reasoning>price is $16</reasoning><answer>$16</answer>" ],
304305 answer = ["16" ],
305306 )
306- self .assertEqual (scores [0 ], 1.5 )
307+ self .assertEqual (scores [0 ], self . config . reward_exact_answer )
307308
308309 @pytest .mark .cpu_only
309310 def test_extracted_non_numeric_no_match (self ):
0 commit comments