mirror of
https://github.com/hiyouga/LlamaFactory.git
synced 2026-03-20 11:43:08 +00:00
alter rewards data type
Former-commit-id: 3eb7eb2d37525da50fe401ab7c59532e6e1ef984
This commit is contained in:
@@ -70,7 +70,7 @@ def main():
     ppo_trainer.save_model()
     ppo_trainer.save_state() # must be after save_model
     if ppo_trainer.is_world_process_zero() and model_args.plot_loss:
-        plot_loss(training_args, keys=["loss", "reward"])
+        plot_loss(training_args.output_dir, keys=["loss", "reward"])
 
 
 def _mp_fn(index):
Reference in New Issue
Block a user