We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent fc865f4, commit f5ad62c. Copy full SHA for f5ad62c
1 file changed
src/maxtext/trainers/post_train/rl/utils_rl.py
@@ -108,7 +108,6 @@ def get_match_format_regex(tmvp_config):
108
r"^[\s]{0,}"
109
rf"{tmvp_config.reasoning_start_token}.+?{tmvp_config.reasoning_end_token}.*?"
110
rf"{tmvp_config.solution_start_token}(.+?){tmvp_config.solution_end_token}"
111
- r"[\s]{0,}$"
112
),
113
flags=re.MULTILINE | re.DOTALL,
114
)
@@ -308,7 +307,7 @@ def fix_latex_escaping(text: str) -> str:
308
307
("\t", "imes", r"\times"), # \t (tab) → \times
309
("\t", "ext", r"\text"), # \t (tab) → \text
310
("\t", "extbf", r"\textbf"), # \t (tab) → \textbf
311
- ("\t", "extit", r"\textit"), # \t (tab) → \textit
+ ("\t", "extit", r"\textit"), # \t (tab) → \textit # codespell:ignore
312
("\r", "ightarrow", r"\rightarrow"), # \r (carriage return) → \rightarrow
313
("\r", "ightarrow", r"\Rightarrow"), # \r (carriage return) → \Rightarrow (capital R handled separately)
314
("\b", "eta", r"\beta"), # \b (backspace) → \beta
0 commit comments