fix shift short attention

Former-commit-id: 9a49cce8e6f6b222f74a07bdab40efee6a77b0f1
This commit is contained in:
hiyouga
2023-10-09 17:07:46 +08:00
parent 5c4248a29c
commit e387a50475
6 changed files with 46 additions and 52 deletions

View File

@@ -149,6 +149,9 @@ def get_train_args(
if general_args.stage == "ppo" and data_args.streaming:
raise ValueError("Streaming mode does not suppport PPO training currently.")
if general_args.stage == "ppo" and model_args.shift_attn:
raise ValueError("PPO training is incompatible with S^2-Attn.")
if training_args.max_steps == -1 and data_args.streaming:
raise ValueError("Please specify `max_steps` in streaming mode.")