Update packing to work with the SDPA and eager attention modes

Former-commit-id: 285636ba3a57a1038b2f2fd4cf909a1ca07708d4
This commit is contained in:
ancv
2024-06-16 02:25:47 +07:00
parent f91fe10985
commit dd7a1dbfae
3 changed files with 148 additions and 73 deletions

View File

@@ -66,6 +66,21 @@ STAGES_USE_PAIR_DATA = {"rm", "dpo"}
# Model-type identifiers accepted for S2-Attn, judging by the constant's name.
# NOTE(review): the consumer of this set is outside this view — confirm usage.
SUPPORTED_CLASS_FOR_S2ATTN = {"llama"}

# Model-type identifiers accepted for multipack (presumably sequence packing —
# confirm against the code that reads this list). Kept as a list, one entry
# per line, so additions produce single-line diffs.
SUPPORTED_CLASS_FOR_MULTIPACK = [
    "llama",
    "mistral",
    "mixtral",
    "qwen2",
    "qwen2_moe",
    "falcon",
    "phi",
    "phi3",
    "gemma",
    "gemmoe",
    "starcoder2",
    "jamba",
]

# File names for the value-head weights; presumably a pickle-style ".bin"
# variant and a safetensors variant — verify against the loader.
V_HEAD_WEIGHTS_NAME = "value_head.bin"
V_HEAD_SAFE_WEIGHTS_NAME = "value_head.safetensors"