update webui
Former-commit-id: da30d0fb4abdb825f3383ddd106bb06a84695b7a
This commit is contained in:
@@ -10,7 +10,13 @@ LAYERNORM_NAMES = ["norm", "ln_f", "ln_attn", "ln_mlp"]
|
||||
|
||||
METHODS = ["full", "freeze", "lora"]
|
||||
|
||||
STAGES = ["Supervised Finetuning", "Reward Modeling", "PPO", "DPO", "Pretraining"]
|
||||
STAGES = [
|
||||
"SFT",
|
||||
"Reward Modeling",
|
||||
"PPO",
|
||||
"DPO",
|
||||
"Pre-Training"
|
||||
]
|
||||
|
||||
SUPPORTED_MODELS = {
|
||||
"LLaMA-7B": "huggyllama/llama-7b",
|
||||
@@ -23,6 +29,10 @@ SUPPORTED_MODELS = {
|
||||
"LLaMA2-7B-Chat": "meta-llama/Llama-2-7b-chat-hf",
|
||||
"LLaMA2-13B-Chat": "meta-llama/Llama-2-13b-chat-hf",
|
||||
"LLaMA2-70B-Chat": "meta-llama/Llama-2-70b-chat-hf",
|
||||
"ChineseLLaMA2-7B": "ziqingyang/chinese-llama-2-7b",
|
||||
"ChineseLLaMA2-13B": "ziqingyang/chinese-llama-2-13b",
|
||||
"ChineseLLaMA2-7B-Chat": "ziqingyang/chinese-alpaca-2-7b",
|
||||
"ChineseLLaMA2-13B-Chat": "ziqingyang/chinese-alpaca-2-13b",
|
||||
"BLOOM-560M": "bigscience/bloom-560m",
|
||||
"BLOOM-3B": "bigscience/bloom-3b",
|
||||
"BLOOM-7B1": "bigscience/bloom-7b1",
|
||||
@@ -41,12 +51,13 @@ SUPPORTED_MODELS = {
|
||||
"Qwen-7B": "Qwen/Qwen-7B",
|
||||
"Qwen-7B-Chat": "Qwen/Qwen-7B-Chat",
|
||||
"XVERSE-13B": "xverse/XVERSE-13B",
|
||||
"ChatGLM2-6B": "THUDM/chatglm2-6b"
|
||||
"ChatGLM2-6B-Chat": "THUDM/chatglm2-6b"
|
||||
}
|
||||
|
||||
DEFAULT_MODULE = {
|
||||
"LLaMA": "q_proj,v_proj",
|
||||
"LLaMA2": "q_proj,v_proj",
|
||||
"ChineseLLaMA2": "q_proj,v_proj",
|
||||
"BLOOM": "query_key_value",
|
||||
"BLOOMZ": "query_key_value",
|
||||
"Falcon": "query_key_value",
|
||||
@@ -59,28 +70,9 @@ DEFAULT_MODULE = {
|
||||
|
||||
DEFAULT_TEMPLATE = {
|
||||
"LLaMA2": "llama2",
|
||||
"ChineseLLaMA2": "llama2_zh",
|
||||
"Baichuan": "baichuan",
|
||||
"InternLM": "intern",
|
||||
"Qwen": "chatml",
|
||||
"ChatGLM2": "chatglm2"
|
||||
}
|
||||
|
||||
# huggingface model name prefix 2 template
|
||||
DEFAULT_TEMPLATE_WITH_CUSTOM_MODEL = {
|
||||
"Llama-2": "llama2",
|
||||
"chinese-alpaca-2": "llama2_zh",
|
||||
"alpaca-7b-wdiff": "alpaca",
|
||||
"vicuna": "vicuna",
|
||||
"BELLE": "belle",
|
||||
"Chinese-LLaMA-2": "linly",
|
||||
"BiLLa": "billa",
|
||||
"Ziya": "ziya",
|
||||
"aquilachat": "aquila",
|
||||
"internlm": "intern",
|
||||
"aquilachat": "aquila",
|
||||
"internlm": "intern",
|
||||
"Baichuan":"baichuan",
|
||||
"starchat":"starchat",
|
||||
"Qwen":"chatml",
|
||||
"chatglm2":"chatglm2"
|
||||
}
|
||||
Reference in New Issue
Block a user