support full-parameter PPO
Former-commit-id: 4af967d69475e1c9fdf1a7983cd6b83bd431abff
This commit is contained in:
@@ -1,3 +1,3 @@
|
||||
from llmtuner.model.loader import load_model_and_tokenizer
|
||||
from llmtuner.model.parser import get_train_args, get_infer_args, get_eval_args
|
||||
from llmtuner.model.utils import dispatch_model, generate_model_card
|
||||
from llmtuner.model.utils import create_ref_model, create_reward_model, dispatch_model, generate_model_card
|
||||
|
||||
Reference in New Issue
Block a user