[assets] update wechat (#8385)

This commit is contained in:
Yaowei Zheng
2025-06-16 18:23:22 +08:00
committed by GitHub
parent 8e4ac78607
commit 9a2d1dec62
5 changed files with 21 additions and 11 deletions

View File

@@ -204,7 +204,12 @@ class RLHFArguments:
)
ld_alpha: Optional[float] = field(
default=None,
-metadata={"help": "α parameter from the LD-DPO paper, which controls the weighting of the verbose token log-probabilities in responses"},
+metadata={
+"help": (
+"Alpha parameter from the LD-DPO paper, which controls the weighting of"
+" the verbose token log-probabilities in responses."
+)
+},
)