We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
2 parents 7656eb8 + 5dd5b3c; commit 2670a9e (Copy full SHA for 2670a9e)
1 file changed
src/maxtext/trainers/post_train/rl/utils_rl.py
@@ -105,7 +105,6 @@ def get_match_format_regex(tmvp_config):
105
"""Returns a compiled regex to extract the answer from a completion."""
106
match_format = re.compile(
107
(
108
- r"^[\s]{0,}"
109
rf"{tmvp_config.reasoning_start_token}.+{tmvp_config.reasoning_end_token}.*?"
110
rf"{tmvp_config.solution_start_token}(.+?){tmvp_config.solution_end_token}"
111
),
0 commit comments