fix style

This commit is contained in:
YeAnbang
2024-07-26 09:55:15 +00:00
parent 9688e19b32
commit 8a3ff4f315
7 changed files with 10 additions and 15 deletions

View File

@@ -26,7 +26,7 @@ from .utils import is_rank_0, to_device
class ORPOTrainer(SLTrainer):
"""
- Trainer for PPO algorithm.
+ Trainer for ORPO algorithm.
Args:
actor (Actor): the actor model in ppo algorithm