add boxed reward

This commit is contained in:
YeAnbang 2025-04-28 18:15:43 +08:00
parent 14c01aec00
commit 064be50946

View File

@@ -144,8 +144,8 @@ if __name__ == "__main__":
max_length=args.max_new_tokens + args.max_prompt_tokens,
do_sample=True,
max_new_tokens=None,
-early_stopping=False,
-stop_strings=["</answer>"],
+early_stopping=False if args.reward_type == "think_answer_tags" else True,
+stop_strings=["</answer>"] if args.reward_type == "think_answer_tags" else None,
)
)
elif args.backend == "vllm":
@@ -161,9 +161,9 @@ if __name__ == "__main__":
generate_config.update(
dict(
max_tokens=args.max_new_tokens, # max new tokens
-ignore_eos=True,
+ignore_eos=True if args.reward_type == "think_answer_tags" else False,
include_stop_str_in_output=True,
-stop=["</answer>"],
+stop=["</answer>"] if args.reward_type == "think_answer_tags" else None,
)
)
else: