Former-commit-id: e5e6a0c50c7a1c0052ed6b459450b9735ff2c9a1
This commit is contained in:
hiyouga
2024-03-28 20:22:31 +08:00
parent f0e564beaa
commit 9408366a36
4 changed files with 12 additions and 14 deletions

View File

@@ -118,10 +118,6 @@ class RLHFArguments:
default=4,
metadata={"help": "The number of epochs to perform in a PPO optimization step."},
)
ppo_logger: Optional[str] = field(
default=None,
metadata={"help": 'Log with either "wandb" or "tensorboard" in PPO training.'},
)
ppo_score_norm: bool = field(
default=False,
metadata={"help": "Use score normalization in PPO training."},