From 7e2ebee646847cc1fad07841830fc95a2db25b58 Mon Sep 17 00:00:00 2001 From: Kashif Rasul Date: Thu, 13 Feb 2025 11:43:42 +0100 Subject: [PATCH] Update src/open_r1/grpo.py Co-authored-by: lewtun --- src/open_r1/grpo.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/open_r1/grpo.py b/src/open_r1/grpo.py index 15f2c159..803a8da0 100644 --- a/src/open_r1/grpo.py +++ b/src/open_r1/grpo.py @@ -159,7 +159,7 @@ def main(script_args, training_args, model_args): ngram_size=script_args.repetition_n_grams, max_penalty=script_args.repetition_max_penalty, ), - "len_reward": len_reward, + "length": len_reward, } reward_funcs = [REWARD_FUNCS_REGISTRY[func] for func in script_args.reward_funcs]