Mirror of https://github.com/hiyouga/LlamaFactory.git (synced 2026-02-02 08:33:38 +00:00)
[data] optimize qwen3 loss computation (#7923)
@@ -191,6 +191,7 @@ class WebChatModel(ChatModel):
         temperature: float,
         skip_special_tokens: bool,
         escape_html: bool,
+        enable_thinking: bool,
     ) -> Generator[tuple[list[dict[str, str]], list[dict[str, str]]], None, None]:
         r"""Generate output text in stream.

@@ -210,6 +211,7 @@ class WebChatModel(ChatModel):
             top_p=top_p,
             temperature=temperature,
             skip_special_tokens=skip_special_tokens,
+            enable_thinking=enable_thinking,
         ):
             response += new_text
             if tools:
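For context, the diff threads a single enable_thinking flag from the web UI's stream() generator into the underlying streaming chat call, so that Qwen3-style thinking output can be toggled per request. Below is a minimal sketch of that pass-through pattern, assuming a simplified setup: stream_reply and fake_stream_chat are hypothetical stand-ins for illustration, not LlamaFactory APIs.

from collections.abc import Generator


def stream_reply(
    prompt: str,
    enable_thinking: bool = True,
) -> Generator[str, None, None]:
    """Yield accumulated response text, optionally letting the backend emit a thinking block first."""

    # Hypothetical backend standing in for the real streaming chat method,
    # which accepts the messages plus generation kwargs such as enable_thinking.
    def fake_stream_chat(messages: list[dict[str, str]], enable_thinking: bool) -> Generator[str, None, None]:
        if enable_thinking:
            yield "<think>planning the answer</think>\n"
        yield "Hello, "
        yield "world!"

    response = ""
    for new_text in fake_stream_chat([{"role": "user", "content": prompt}], enable_thinking):
        response += new_text
        # Yield the accumulated text so far, mirroring the web UI's incremental updates.
        yield response


if __name__ == "__main__":
    for partial in stream_reply("hi", enable_thinking=False):
        print(partial)

The point of the pattern is that the flag is plumbed through unchanged rather than hard-coded, so the caller (here the web chat layer) decides per request whether thinking tokens are generated.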