support deepseek-v3-20250324

jinhui.li
2025-03-25 14:51:28 +08:00
parent ba2da2f4ed
commit 93fcd77544
17 changed files with 2050 additions and 485 deletions

.gitignore

@@ -1,3 +1,5 @@
 node_modules
 .env
 log.txt
+.idea
+dist

CLAUDE.md

@@ -1,25 +0,0 @@
# CLAUDE.md
## Build/Lint/Test Commands
- Install dependencies: `npm i`
- Start server: `node index.mjs` (requires OPENAI_API_KEY, OPENAI_BASE_URL, OPENAI_MODEL env vars)
- Set environment variables:
```shell
export DISABLE_PROMPT_CACHING=1
export ANTHROPIC_AUTH_TOKEN="test"
export ANTHROPIC_BASE_URL="http://127.0.0.1:3456"
export API_TIMEOUT_MS=600000
```
## Code Style Guidelines
- Follow existing formatting in README.md and other files
- Use ES module syntax (`import`/`export`)
- Environment variables are uppercase with underscores
- API endpoints use `/v1/` prefix
- JSON payloads follow strict structure with model, max_tokens, messages, system, etc.
- Include type information in JSON payloads where possible
- Use descriptive variable names
- Keep code modular - separate files for router, index, etc.
- Include example usage/documentation in README
- Use markdown code blocks for code samples
- Document API endpoints and parameters

README.md

@@ -2,13 +2,13 @@
 > This is a repository for testing routing Claude Code requests to different models.
-![demo.png](https://github.com/musistudio/claude-code-reverse/blob/main/screenshoots/demo.png)
+![demo.png](https://github.com/musistudio/claude-code-router/blob/main/screenshoots/demo.png)
 ## Warning! This project is for testing purposes and may consume a lot of tokens! It may also fail to complete tasks!
 ## Implemented
-- [x] Mormal Mode and Router Mode
+- [x] Normal Mode and Router Mode
 - [x] Using the qwen2.5-coder-3b model as the routing dispatcher (since it's currently free on Alibaba Cloud's official website)
@@ -30,56 +30,22 @@ Thanks to the free qwen2.5-coder-3b model from Alibaba and deepseek's KV-Cache
 npm install -g @anthropic-ai/claude-code
 ```
-1. Clone this repo
+1. Install claude-code-router
 ```shell
-git clone https://github.com/musistudio/claude-code-reverse.git
+npm install -g @musistudio/claude-code-router
 ```
-2. Install dependencies
+2. Start claude-code-router server
 ```shell
-npm i
+claude-code-router
 ```
-3. Start server
-```shell
-# Alternatively, you can create an .env file in the repo directory
-# You can refer to the .env.example file to create the .env file
-## disable router
-ENABLE_ROUTER=false
-OPENAI_API_KEY=""
-OPENAI_BASE_URL=""
-OPENAI_MODEL=""
-## enable router
-ENABLE_ROUTER=true
-export TOOL_AGENT_API_KEY=""
-export TOOL_AGENT_BASE_URL=""
-export TOOL_AGENT_MODEL="qwen-max-2025-01-25"
-export CODER_AGENT_API_KEY=""
-export CODER_AGENT_BASE_URL="https://api.deepseek.com"
-export CODER_AGENT_MODEL="deepseek-chat"
-export THINK_AGENT_API_KEY=""
-export THINK_AGENT_BASE_URL="https://api.deepseek.com"
-export THINK_AGENT_MODEL="deepseek-reasoner"
-export ROUTER_AGENT_API_KEY=""
-export ROUTER_AGENT_BASE_URL=""
-export ROUTER_AGENT_MODEL="qwen2.5-coder-3b-instruct"
-node index.mjs
-```
-4. Set environment variable to start claude code
+3. Set environment variable to start claude code
 ```shell
 export DISABLE_PROMPT_CACHING=1
 export ANTHROPIC_AUTH_TOKEN="test"
 export ANTHROPIC_BASE_URL="http://127.0.0.1:3456"
 export API_TIMEOUT_MS=600000
 claude
@@ -102,4 +68,4 @@ CODER_AGENT_MODEL and THINK_AGENT_MODEL can use the DeepSeek series of models.
 The purpose of router mode is to separate tool invocation from coding tasks, enabling the use of inference models like r1, which do not support function calling.
-![router mode](https://github.com/musistudio/claude-code-reverse/blob/main/screenshoots/router.png)
+![router mode](https://github.com/musistudio/claude-code-router/blob/main/screenshoots/router.png)

index.mjs

@@ -1,330 +0,0 @@
import express from "express";
import { OpenAI } from "openai";
import dotenv from "dotenv";
import { existsSync } from "fs";
import { writeFile } from "fs/promises";
import { Router } from "./router.mjs";
import { getOpenAICommonOptions } from "./utils.mjs";
dotenv.config();
const app = express();
const port = 3456;
app.use(express.json({ limit: "500mb" }));
let client;
if (process.env.ENABLE_ROUTER && process.env.ENABLE_ROUTER === "true") {
const router = new Router();
client = {
call: (data) => {
return router.route(data);
},
};
} else {
const openai = new OpenAI({
apiKey: process.env.OPENAI_API_KEY,
baseURL: process.env.OPENAI_BASE_URL,
...getOpenAICommonOptions(),
});
client = {
call: (data) => {
data.model = process.env.OPENAI_MODEL;
return openai.chat.completions.create(data);
},
};
}
app.post("/v1/messages", async (req, res) => {
try {
let {
model,
max_tokens,
messages,
system = [],
temperature,
metadata,
tools,
} = req.body;
messages = messages.map((item) => {
if (item.content instanceof Array) {
return {
role: item.role,
content: item.content.map((it) => {
const msg = {
...it,
type: ["tool_result", "tool_use"].includes(it?.type)
? "text"
: it?.type,
};
if (msg.type === "text") {
msg.text = it?.content
? JSON.stringify(it.content)
: it?.text || "";
delete msg.content;
}
return msg;
}),
};
}
return {
role: item.role,
content: item.content,
};
});
const data = {
model,
messages: [
...system.map((item) => ({
role: "system",
content: item.text,
})),
...messages,
],
temperature,
stream: true,
};
if (tools) {
data.tools = tools
.filter((tool) => !["StickerRequest"].includes(tool.name))
.map((item) => ({
type: "function",
function: {
name: item.name,
description: item.description,
parameters: item.input_schema,
},
}));
}
const completion = await client.call(data);
// Set SSE response headers
res.setHeader("Content-Type", "text/event-stream");
res.setHeader("Cache-Control", "no-cache");
res.setHeader("Connection", "keep-alive");
const messageId = "msg_" + Date.now();
let contentBlockIndex = 0;
let currentContentBlocks = [];
// Send message_start event
const messageStart = {
type: "message_start",
message: {
id: messageId,
type: "message",
role: "assistant",
content: [],
model,
stop_reason: null,
stop_sequence: null,
usage: { input_tokens: 1, output_tokens: 1 },
},
};
res.write(
`event: message_start\ndata: ${JSON.stringify(messageStart)}\n\n`
);
let isToolUse = false;
let toolUseJson = "";
let currentToolCall = null;
let hasStartedTextBlock = false;
for await (const chunk of completion) {
const delta = chunk.choices[0].delta;
if (delta.tool_calls && delta.tool_calls.length > 0) {
const toolCall = delta.tool_calls[0];
if (!isToolUse) {
// Start new tool call block
isToolUse = true;
currentToolCall = toolCall;
const toolBlockStart = {
type: "content_block_start",
index: contentBlockIndex,
content_block: {
type: "tool_use",
id: `toolu_${Date.now()}`,
name: toolCall.function.name,
input: {},
},
};
// Add to content blocks list
currentContentBlocks.push({
type: "tool_use",
id: toolBlockStart.content_block.id,
name: toolCall.function.name,
input: {},
});
res.write(
`event: content_block_start\ndata: ${JSON.stringify(
toolBlockStart
)}\n\n`
);
toolUseJson = "";
}
// Stream tool call JSON
if (toolCall.function.arguments) {
const jsonDelta = {
type: "content_block_delta",
index: contentBlockIndex,
delta: {
type: "input_json_delta",
partial_json: toolCall.function.arguments,
},
};
toolUseJson += toolCall.function.arguments;
// Try to parse complete JSON and update content block
try {
const parsedJson = JSON.parse(toolUseJson);
currentContentBlocks[contentBlockIndex].input = parsedJson;
} catch (e) {
// JSON not yet complete, continue accumulating
}
res.write(
`event: content_block_delta\ndata: ${JSON.stringify(jsonDelta)}\n\n`
);
}
} else if (delta.content) {
// Handle regular text content
if (isToolUse) {
// End previous tool call block
const contentBlockStop = {
type: "content_block_stop",
index: contentBlockIndex,
};
res.write(
`event: content_block_stop\ndata: ${JSON.stringify(
contentBlockStop
)}\n\n`
);
contentBlockIndex++;
isToolUse = false;
}
if (!delta.content) continue;
// If text block not yet started, send content_block_start
if (!hasStartedTextBlock) {
const textBlockStart = {
type: "content_block_start",
index: contentBlockIndex,
content_block: {
type: "text",
text: "",
},
};
// Add to content blocks list
currentContentBlocks.push({
type: "text",
text: "",
});
res.write(
`event: content_block_start\ndata: ${JSON.stringify(
textBlockStart
)}\n\n`
);
hasStartedTextBlock = true;
}
// Send regular text content
const contentDelta = {
type: "content_block_delta",
index: contentBlockIndex,
delta: {
type: "text_delta",
text: delta.content,
},
};
// Update content block text
if (currentContentBlocks[contentBlockIndex]) {
currentContentBlocks[contentBlockIndex].text += delta.content;
}
res.write(
`event: content_block_delta\ndata: ${JSON.stringify(
contentDelta
)}\n\n`
);
}
}
// Close last content block
const contentBlockStop = {
type: "content_block_stop",
index: contentBlockIndex,
};
res.write(
`event: content_block_stop\ndata: ${JSON.stringify(contentBlockStop)}\n\n`
);
// Send message_delta event with appropriate stop_reason
const messageDelta = {
type: "message_delta",
delta: {
stop_reason: isToolUse ? "tool_use" : "end_turn",
stop_sequence: null,
content: currentContentBlocks,
},
usage: { input_tokens: 100, output_tokens: 150 },
};
res.write(
`event: message_delta\ndata: ${JSON.stringify(messageDelta)}\n\n`
);
// Send message_stop event
const messageStop = {
type: "message_stop",
};
res.write(`event: message_stop\ndata: ${JSON.stringify(messageStop)}\n\n`);
res.end();
} catch (error) {
console.error("Error in streaming response:", error);
res.status(400).json({
status: "error",
message: error.message,
});
}
});
async function initializeClaudeConfig() {
const homeDir = process.env.HOME;
const configPath = `${homeDir}/.claude.json`;
if (!existsSync(configPath)) {
const userID = Array.from(
{ length: 64 },
() => Math.random().toString(16)[2]
).join("");
const configContent = {
numStartups: 184,
autoUpdaterStatus: "enabled",
userID,
hasCompletedOnboarding: true,
lastOnboardingVersion: "0.2.9",
projects: {},
};
await writeFile(configPath, JSON.stringify(configContent, null, 2));
}
}
async function run() {
await initializeClaudeConfig();
app.listen(port, "127.0.0.1", () => {
console.log(`Example app listening on port ${port}`);
});
}
run();

package.json

@@ -1,19 +1,35 @@
 {
   "name": "claude-code-router",
   "version": "1.0.0",
-  "description": "You can switch the API endpoint by modifying the ANTHROPIC_BASE_URL environment variable.",
-  "main": "index.mjs",
-  "scripts": {
-    "test": "echo \"Error: no test specified\" && exit 1",
-    "start": "node index.mjs"
+  "description": "Use Claude Code without an Anthropic account and route it to another LLM provider",
+  "bin": {
+    "claude-code-router": "./dist/cli.js"
   },
-  "keywords": [],
-  "author": "",
-  "license": "ISC",
+  "scripts": {
+    "start": "node dist/cli.js",
+    "build": "tsc && esbuild src/index.ts --bundle --platform=node --outfile=dist/cli.js"
+  },
+  "keywords": ["claude", "code", "router", "llm", "anthropic"],
+  "author": "musistudio",
+  "license": "MIT",
   "dependencies": {
+    "@anthropic-ai/claude-code": "^0.2.53",
+    "@anthropic-ai/sdk": "^0.39.0",
     "dotenv": "^16.4.7",
     "express": "^4.21.2",
     "https-proxy-agent": "^7.0.6",
     "openai": "^4.85.4"
-  }
+  },
+  "devDependencies": {
+    "@types/express": "^5.0.0",
+    "esbuild": "^0.25.1",
+    "typescript": "^5.8.2"
+  },
+  "publishConfig": {
+    "ignore": [
+      "!build/",
+      "src/",
+      "screenshots/"
+    ]
+  }
 }

pnpm-lock.yaml (generated, new file; diff suppressed because it is too large)

src/constants.ts (new file)

@@ -0,0 +1,28 @@
import path from "node:path";
import os from "node:os";
export const HOME_DIR = path.join(os.homedir(), ".claude-code-router");
export const CONFIG_FILE = `${HOME_DIR}/config.json`;
export const PROMPTS_DIR = `${HOME_DIR}/prompts`;
export const DEFAULT_CONFIG = {
log: false,
ENABLE_ROUTER: true,
OPENAI_API_KEY: "",
OPENAI_BASE_URL: "https://openrouter.ai/api/v1",
OPENAI_MODEL: "openai/o3-mini",
CODER_AGENT_API_KEY: "",
CODER_AGENT_BASE_URL: "https://api.deepseek.com",
CODER_AGENT_MODEL: "deepseek-chat",
THINK_AGENT_API_KEY: "",
THINK_AGENT_BASE_URL: "https://api.deepseek.com",
THINK_AGENT_MODEL: "deepseek-reasoner",
ROUTER_AGENT_API_KEY: "",
ROUTER_AGENT_BASE_URL: "https://api.deepseek.com",
ROUTER_AGENT_MODEL: "deepseek-chat",
};
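
These defaults double as the user-config schema: src/utils/index.ts reads `~/.claude-code-router/config.json`, falls back to DEFAULT_CONFIG, and copies the result onto process.env. A minimal sketch of a partial override, assuming only the single-model (non-router) path is wanted; all values are placeholders:

```ts
// Sketch: contents a user's ~/.claude-code-router/config.json might carry.
// initConfig (src/utils/index.ts) Object.assigns these onto process.env, so
// src/server.ts sees ENABLE_ROUTER === "false" and takes the single-model
// branch. Values are placeholders, not working credentials.
const exampleUserConfig = {
  ENABLE_ROUTER: false,
  OPENAI_API_KEY: "sk-placeholder",
  OPENAI_BASE_URL: "https://api.deepseek.com",
  OPENAI_MODEL: "deepseek-chat",
};
```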

src/deepseek.ts (new file)

@@ -0,0 +1,140 @@
import { OpenAI } from "openai";
import { createClient } from "./utils";
import { log } from "./utils/log";
export interface BaseRouter {
name: string;
description: string;
run: (
args: OpenAI.Chat.Completions.ChatCompletionCreateParams
) => Promise<any>;
}
const thinkRouter: BaseRouter = {
name: "think",
description: `This agent is used solely for complex reasoning and thinking tasks. It should not be called for information retrieval or repetitive, frequent requests. Only use this agent for tasks that require deep analysis or problem-solving. If there is an existing result from the Thinker agent, do not call this agent again. You are only responsible for deep thinking that splits the task into steps; do not do any coding or call any tools. Finally, return the split steps in order, e.g.\n1. xxx\n2. xxx\n3. xxx`,
run(args) {
const client = createClient({
apiKey: process.env.THINK_AGENT_API_KEY,
baseURL: process.env.THINK_AGENT_BASE_URL,
});
const messages = JSON.parse(JSON.stringify(args.messages));
messages.forEach((msg: any) => {
if (Array.isArray(msg.content)) {
msg.content = JSON.stringify(msg.content);
}
});
let startIdx = messages.findIndex((msg: any) => msg.role !== "system");
if (startIdx === -1) startIdx = messages.length;
for (let i = startIdx; i < messages.length; i++) {
const expectedRole = (i - startIdx) % 2 === 0 ? "user" : "assistant";
messages[i].role = expectedRole;
}
if (
messages.length > 0 &&
messages[messages.length - 1].role === "assistant"
) {
messages.push({
role: "user",
content:
"Please follow the instructions provided above to resolve the issue.",
});
}
delete args.tools;
return client.chat.completions.create({
...args,
messages,
model: process.env.THINK_AGENT_MODEL as string,
});
},
};
export class Router {
routers: BaseRouter[];
client: OpenAI;
constructor() {
this.routers = [thinkRouter];
this.client = createClient({
apiKey: process.env.ROUTER_AGENT_API_KEY,
baseURL: process.env.ROUTER_AGENT_BASE_URL,
});
}
async route(
args: OpenAI.Chat.Completions.ChatCompletionCreateParams
): Promise<any> {
log(`Request Router: ${JSON.stringify(args, null, 2)}`);
const res: OpenAI.Chat.Completions.ChatCompletion =
await this.client.chat.completions.create({
...args,
messages: [
...args.messages,
{
role: "system",
content: `## **Guidelines:**
- **Trigger the "think" mode when the user's request involves deep thinking, complex reasoning, or multi-step analysis.**
- **Criteria:**
- Involves multi-layered logical reasoning or causal analysis
- Requires establishing connections or pattern recognition between different pieces of information
- Involves cross-domain knowledge integration or weighing multiple possibilities
- Requires creative thinking or non-direct inference
### **Format requirements:**
- When you need to trigger the "think" mode, return the following JSON format:
\`\`\`json
{
"use": "think"
}
\`\`\`
`,
},
],
model: process.env.ROUTER_AGENT_MODEL as string,
stream: false,
});
let result;
try {
const text = res.choices[0].message.content;
if (!text) {
throw new Error("No text");
}
result = JSON.parse(
text.slice(text.indexOf("{"), text.lastIndexOf("}") + 1)
);
} catch (e) {
(res.choices[0] as any).delta = res.choices[0].message;
log(`No Router: ${JSON.stringify(res.choices[0].message)}`);
return [res];
}
const router = this.routers.find((item) => item.name === result.use);
if (!router) {
(res.choices[0] as any).delta = res.choices[0].message;
log(`No Router: ${JSON.stringify(res.choices[0].message)}`);
return [res];
}
log(`Use Router: ${router.name}`);
if (router.name === "think") {
const agentResult = await router.run({
...args,
stream: false,
});
try {
args.messages.push({
role: "user",
content:
`${router.name} Agent Result: ` +
agentResult.choices[0].message.content,
});
log(
`${router.name} Agent Result: ` +
agentResult.choices[0].message.content
);
return await this.route(args);
} catch (error) {
console.log(agentResult);
throw error;
}
}
return router.run(args);
}
}
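
Note the fallback contract in route(): when the dispatcher's reply is not routable JSON, choices[0].message is mirrored onto a delta field and the completion is returned as the one-element array [res], which the SSE writer can iterate exactly like a stream. A minimal sketch of driving the class directly, assuming the ROUTER/THINK agent variables are set (the model value and prompt are illustrative):

```ts
import { Router } from "./deepseek";

// Sketch: exercise the router outside the HTTP server. The model value is a
// placeholder; each agent substitutes its own *_AGENT_MODEL before calling out.
async function demo() {
  const router = new Router();
  const completion = await router.route({
    model: "placeholder",
    messages: [{ role: "user", content: "Break this refactor into steps." }],
    stream: true,
  });
  // Either a live OpenAI stream or the wrapped one-element array [res]:
  for await (const chunk of completion) {
    console.log(chunk.choices[0].delta);
  }
}
demo();
```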

src/index.ts (new file)

@@ -0,0 +1,35 @@
import { existsSync } from "fs";
import { writeFile } from "fs/promises";
import { initConfig, initDir } from "./utils";
import { createServer } from "./server";
import { rewriteToolsPrompt } from "./middlewares/rewriteToolsPrompt";
async function initializeClaudeConfig() {
const homeDir = process.env.HOME;
const configPath = `${homeDir}/.claude.json`;
if (!existsSync(configPath)) {
const userID = Array.from(
{ length: 64 },
() => Math.random().toString(16)[2]
).join("");
const configContent = {
numStartups: 184,
autoUpdaterStatus: "enabled",
userID,
hasCompletedOnboarding: true,
lastOnboardingVersion: "0.2.9",
projects: {},
};
await writeFile(configPath, JSON.stringify(configContent, null, 2));
}
}
async function run() {
await initializeClaudeConfig();
await initDir();
await initConfig();
const server = createServer(3456);
server.useMiddleware(rewriteToolsPrompt);
server.start();
}
run();

src/middlewares/rewriteToolsPrompt.ts (new file)

@@ -0,0 +1,34 @@
import { Request, Response, NextFunction } from "express";
import { readFile, access } from "node:fs/promises";
import { join } from "node:path";
import { PROMPTS_DIR } from "../constants";
const getPrompt = async (name: string) => {
try {
const promptPath = join(PROMPTS_DIR, `${name}.md`);
await access(promptPath);
const prompt = await readFile(promptPath, "utf-8");
return prompt;
} catch {
return null;
}
};
export const rewriteToolsPrompt = async (
req: Request,
res: Response,
next: NextFunction
) => {
const { tools } = req.body;
if (!Array.isArray(tools)) {
next();
return;
}
for (const tool of tools) {
const prompt = await getPrompt(tool.name);
if (prompt) {
tool.description = prompt;
}
}
next();
};
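
The practical effect: dropping a markdown file named after a tool into `~/.claude-code-router/prompts` replaces that tool's description before the request reaches the model. A hedged sketch; the tool name "BashTool" is hypothetical, substitute whatever tool names Claude Code actually sends:

```ts
import { writeFile } from "node:fs/promises";
import { join } from "node:path";
import os from "node:os";

// Sketch: create ~/.claude-code-router/prompts/BashTool.md so the middleware
// above swaps this text in as the tool's description on every request.
// "BashTool" is a hypothetical tool name.
async function overrideToolPrompt() {
  const promptsDir = join(os.homedir(), ".claude-code-router", "prompts");
  await writeFile(
    join(promptsDir, "BashTool.md"),
    "Run shell commands non-interactively; avoid destructive operations."
  );
}
overrideToolPrompt();
```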

src/router.ts

@@ -1,38 +1,21 @@
 import { OpenAI } from "openai";
-import { getOpenAICommonOptions } from "./utils.mjs";
+import { createClient } from "./utils";
+import { log } from "./utils/log";
+export interface BaseRouter {
+  name: string;
+  description: string;
+  run: (
+    args: OpenAI.Chat.Completions.ChatCompletionCreateParams
+  ) => Promise<any>;
+}
-const useToolRouter = {
-  name: "use-tool",
-  description: `This agent can call user-specified tools to perform tasks. The user provides a list of tools to be used, and the agent integrates these tools to complete the specified tasks efficiently. The agent follows user instructions and ensures proper tool utilization for each request`,
-  run(args) {
-    const client = new OpenAI({
-      apiKey: process.env.TOOL_AGENT_API_KEY,
-      baseURL: process.env.TOOL_AGENT_BASE_URL,
-      ...getOpenAICommonOptions(),
-    });
-    return client.chat.completions.create({
-      ...args,
-      messages: [
-        ...args.messages,
-        {
-          role: "system",
-          content:
-            "You need to select the appropriate tool for the task based on the users request. Review the requirements and choose the tool that fits the task best.",
-        },
-      ],
-      model: process.env.TOOL_AGENT_MODEL,
-    });
-  },
-};
-const coderRouter = {
+const coderRouter: BaseRouter = {
   name: "coder",
-  description: `This agent is solely responsible for helping users write code. This agent could not call tools. This agent is used for writing and modifying code when the user provides clear and specific coding requirements. For example, tasks like implementing a quicksort algorithm in JavaScript or creating an HTML layout. If the user's request is unclear or cannot be directly translated into code, please route the task to 'Thinker' first for clarification or further processing.`,
+  description: `This agent is solely responsible for helping users write code. This agent could not call tools. This agent is used for writing and modifying code when the user provides clear and specific coding requirements. For example, tasks like implementing a quicksort algorithm in JavaScript or creating an HTML layout. If the user's request is unclear or cannot be directly translated into code, please route the task to 'think' first for clarification or further processing.`,
   run(args) {
-    const client = new OpenAI({
+    const client = createClient({
       apiKey: process.env.CODER_AGENT_API_KEY,
       baseURL: process.env.CODER_AGENT_BASE_URL,
-      ...getOpenAICommonOptions(),
     });
     delete args.tools;
     args.messages.forEach((item) => {
@@ -50,28 +33,51 @@ const coderRouter = {
           "You are a code writer who helps users write code based on their specific requirements. You create algorithms, implement functionality, and build structures according to the clear instructions provided by the user. Your focus is solely on writing code, ensuring that the task is completed accurately and efficiently.",
         },
       ],
-      model: process.env.CODER_AGENT_MODEL,
+      model: process.env.CODER_AGENT_MODEL as string,
     });
   },
 };
-const thinkRouter = {
-  name: "thinker",
-  description: `This agent is used solely for complex reasoning and thinking tasks. It should not be called for information retrieval or repetitive, frequent requests. Only use this agent for tasks that require deep analysis or problem-solving. If there is an existing result from the Thinker agent, do not call this agent again.`,
+const useToolRouter: BaseRouter = {
+  name: "use-tool",
+  description: `This agent can call user-specified tools to perform tasks. The user provides a list of tools to be used, and the agent integrates these tools to complete the specified tasks efficiently. The agent follows user instructions and ensures proper tool utilization for each request`,
   run(args) {
-    const client = new OpenAI({
+    const client = createClient({
+      apiKey: process.env.TOOL_AGENT_API_KEY,
+      baseURL: process.env.TOOL_AGENT_BASE_URL,
+    });
+    return client.chat.completions.create({
+      ...args,
+      messages: [
+        ...args.messages,
+        {
+          role: "system",
+          content:
+            "You need to select the appropriate tool for the task based on the user's request. Review the requirements and choose the tool that fits the task best.",
+        },
+      ],
+      model: process.env.TOOL_AGENT_MODEL as string,
+    });
+  },
+};
+const thinkRouter: BaseRouter = {
+  name: "think",
+  description: `This agent is used solely for complex reasoning and thinking tasks. It should not be called for information retrieval or repetitive, frequent requests. Only use this agent for tasks that require deep analysis or problem-solving. If there is an existing result from the Thinker agent, do not call this agent again. You are only responsible for deep thinking that splits the task into steps; do not do any coding or call any tools. Finally, return the split steps in order, e.g.\n1. xxx\n2. xxx\n3. xxx`,
+  run(args) {
+    const client = createClient({
       apiKey: process.env.THINK_AGENT_API_KEY,
       baseURL: process.env.THINK_AGENT_BASE_URL,
-      ...getOpenAICommonOptions(),
     });
     const messages = JSON.parse(JSON.stringify(args.messages));
-    messages.forEach((msg) => {
+    messages.forEach((msg: any) => {
       if (Array.isArray(msg.content)) {
         msg.content = JSON.stringify(msg.content);
       }
     });
-    let startIdx = messages.findIndex((msg) => msg.role !== "system");
+    let startIdx = messages.findIndex((msg: any) => msg.role !== "system");
     if (startIdx === -1) startIdx = messages.length;
     for (let i = startIdx; i < messages.length; i++) {
@@ -93,73 +99,102 @@ const thinkRouter = {
     return client.chat.completions.create({
       ...args,
       messages,
-      model: process.env.THINK_AGENT_MODEL,
+      model: process.env.THINK_AGENT_MODEL as string,
     });
   },
 };
 export class Router {
+  routers: BaseRouter[];
+  client: OpenAI;
   constructor() {
-    this.routers = [useToolRouter, coderRouter, thinkRouter];
-    this.client = new OpenAI({
+    this.routers = [coderRouter, useToolRouter, thinkRouter];
+    this.client = createClient({
       apiKey: process.env.ROUTER_AGENT_API_KEY,
       baseURL: process.env.ROUTER_AGENT_BASE_URL,
-      ...getOpenAICommonOptions(),
     });
   }
-  async route(args) {
-    const res = await this.client.chat.completions.create({
+  async route(
+    args: OpenAI.Chat.Completions.ChatCompletionCreateParams
+  ): Promise<any> {
+    log(`Route: ${JSON.stringify(args, null, 2)}`);
+    const res: OpenAI.Chat.Completions.ChatCompletion =
+      await this.client.chat.completions.create({
         ...args,
         messages: [
          ...args.messages,
          {
            role: "system",
-            content: `You are an AI task router that receives user requests and forwards them to the appropriate AI models for task handling. You do not process any requests directly but are responsible for understanding the user's request and choosing the correct router based on the task and necessary steps. The available routers are: ${JSON.stringify(
-              this.routers.map((router) => {
-                return {
-                  name: router.name,
-                  description: router.description,
-                };
-              })
-            )}. Each router is designated for specific types of tasks, and you ensure that the request is routed accordingly for efficient processing. Use the appropriate router based on the users request:
+            content: `You are an AI task router and executor, responsible for understanding user requests and directing them to the appropriate processing mode or tool based on the task type and requirements. Your main responsibility is to determine the nature of the request, execute the task when possible, and respond appropriately.
-If external tools are needed to gather more information, use the 'use-tool' router.
-If the task involves writing code, use the 'coder' router.
-If deep reasoning or analysis is required to break down steps, use the 'thinker' router.
-Instead, format your response as a JSON object with one field: 'use' (string)`,
+### **Guidelines:**
+- **If an external tool is required to complete the task (such as searching for information, generating images, or modifying code), route the task to \`use-tool\` rather than handling it directly.**
+- If the task requires generating an image, route to \`use-tool\` and specify the image generation tool.
+- If the task requires searching for information, route to \`use-tool\` and specify the search tool.
+- If the task requires modifying or executing code, route to \`use-tool\` and specify the code handling tool.
+- **Do NOT execute the tool action directly; always trigger it through \`use-tool\`.**
+- **If the user is chatting casually or having a general conversation, respond naturally and conversationally. Improving the user experience through friendly interactions is one of your main responsibilities.**
+- **If the user's request involves deep thinking, complex reasoning, or multi-step analysis, use the "think" mode to break down and solve the problem.**
+- **If the user's request involves coding or technical implementation, use the "coder" mode to generate or modify code.**
+- **After generating the code, if the task requires applying or integrating the code, route to \`use-tool\` and specify the code execution tool.**
+- **Do NOT re-trigger "coder" to apply code; route to \`use-tool\` instead.**
+### **Format requirements:**
+- When you need to trigger a specific mode (such as "think", "coder", or "use-tool"), return the following JSON format:
+### IMPORTANT:
+- Do NOT call BatchTool directly; use \`use-tool\` and let \`use-tool\` invoke BatchTool.
+\`\`\`json
+{
+  "use": "<mode-name>",
+}
+\`\`\`
+`,
          },
        ],
-        model: process.env.ROUTER_AGENT_MODEL,
+        model: process.env.ROUTER_AGENT_MODEL as string,
        stream: false,
      });
    let result;
    try {
      const text = res.choices[0].message.content;
      if (!text) {
        throw new Error("No text");
      }
      result = JSON.parse(
        text.slice(text.indexOf("{"), text.lastIndexOf("}") + 1)
      );
    } catch (e) {
      console.log(e);
-      res.choices[0].delta = res.choices[0].message;
+      (res.choices[0] as any).delta = res.choices[0].message;
      return [res];
    }
    const router = this.routers.find((item) => item.name === result.use);
    if (!router) {
-      res.choices[0].delta = res.choices[0].message;
+      (res.choices[0] as any).delta = res.choices[0].message;
+      log(`No Router: ${JSON.stringify(res.choices[0].message)}`);
      return [res];
    }
-    if (router.name === "thinker" || router.name === "coder") {
+    log(`Use Router: ${router.name}`);
+    if (router.name === "think" || router.name === "coder") {
      const agentResult = await router.run({
        ...args,
        stream: false,
      });
      try {
        args.messages.push({
-          role: "assistant",
+          role: "user",
          content:
            `${router.name} Agent Result: ` +
            agentResult.choices[0].message.content,
        });
+        log(
+          `${router.name} Agent Result: ` +
+            agentResult.choices[0].message.content
+        );
        return await this.route(args);
      } catch (error) {
        console.log(agentResult);

src/server.ts (new file)

@@ -0,0 +1,159 @@
import express, { RequestHandler } from "express";
import {
ContentBlockParam,
MessageCreateParamsBase,
} from "@anthropic-ai/sdk/resources/messages";
import { OpenAI } from "openai";
import { Router } from "./deepseek";
import { getOpenAICommonOptions } from "./utils";
import { streamOpenAIResponse } from "./utils/stream";
interface Client {
call: (
data: OpenAI.Chat.Completions.ChatCompletionCreateParams
) => Promise<any>;
}
interface Server {
app: express.Application;
useMiddleware: (middleware: RequestHandler) => void;
start: () => void;
}
export const createServer = (port: number): Server => {
const app = express();
app.use(express.json({ limit: "500mb" }));
let client: Client;
if (process.env.ENABLE_ROUTER && process.env.ENABLE_ROUTER === "true") {
const router = new Router();
client = {
call: (data) => {
return router.route(data);
},
};
} else {
const openai = new OpenAI({
apiKey: process.env.OPENAI_API_KEY,
baseURL: process.env.OPENAI_BASE_URL,
...getOpenAICommonOptions(),
});
client = {
call: (data) => {
if (process.env.OPENAI_MODEL) {
data.model = process.env.OPENAI_MODEL;
}
return openai.chat.completions.create(data);
},
};
}
app.post("/v1/messages", async (req, res) => {
try {
let {
model,
max_tokens,
messages,
system = [],
temperature,
metadata,
tools,
}: MessageCreateParamsBase = req.body;
const openAIMessages: OpenAI.Chat.Completions.ChatCompletionMessageParam[] =
messages.map((item) => {
if (item.content instanceof Array) {
return {
role: item.role,
content: item.content
.map((it: ContentBlockParam) => {
if (it.type === "text") {
return typeof it.text === "string"
? it.text
: JSON.stringify(it);
}
return JSON.stringify(it);
})
.join(""),
} as OpenAI.Chat.Completions.ChatCompletionMessageParam;
}
return {
role: item.role,
content:
typeof item.content === "string"
? item.content
: JSON.stringify(item.content),
};
});
const systemMessages: OpenAI.Chat.Completions.ChatCompletionMessageParam[] =
Array.isArray(system)
? system.map((item) => ({
role: "system",
content: item.text,
}))
: [{ role: "system", content: system }];
const data: OpenAI.Chat.Completions.ChatCompletionCreateParams = {
model,
messages: [...systemMessages, ...openAIMessages],
temperature,
stream: true,
};
if (tools) {
data.tools = tools
.filter((tool) => !["StickerRequest"].includes(tool.name))
.map((item: any) => ({
type: "function",
function: {
name: item.name,
description: item.description,
parameters: item.input_schema,
},
}));
}
res.setHeader("Content-Type", "text/event-stream");
res.setHeader("Cache-Control", "no-cache");
res.setHeader("Connection", "keep-alive");
try {
const completion = await client.call(data);
await streamOpenAIResponse(res, completion, model);
} catch (e) {
console.error("Error in OpenAI API call:", e);
}
} catch (error) {
console.error("Error in request processing:", error);
const errorCompletion: AsyncIterable<OpenAI.Chat.Completions.ChatCompletionChunk> =
{
async *[Symbol.asyncIterator]() {
yield {
id: `error_${Date.now()}`,
created: Math.floor(Date.now() / 1000),
model: "gpt-3.5-turbo",
object: "chat.completion.chunk",
choices: [
{
index: 0,
delta: {
content: `Error: ${(error as Error).message}`,
},
finish_reason: "stop",
},
],
};
},
};
await streamOpenAIResponse(res, errorCompletion, "gpt-3.5-turbo");
}
});
return {
app,
useMiddleware: (middleware: RequestHandler) => {
app.use("/v1/messages", middleware);
},
start: () => {
app.listen(port, () => {
console.log(`Server is running on port ${port}`);
});
},
};
};
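
The endpoint accepts Anthropic's Messages payload and flattens content-block arrays to plain strings before forwarding. For orientation, a sketch of a request body it would handle (all values are placeholders):

```ts
// Sketch: the Anthropic-style body Claude Code posts to
// http://127.0.0.1:3456/v1/messages. Field values are placeholders.
const exampleBody = {
  model: "claude-3-7-sonnet-20250219", // echoed back in the SSE events
  max_tokens: 1024,
  system: [{ type: "text", text: "You are a coding assistant." }],
  messages: [
    { role: "user", content: [{ type: "text", text: "Write quicksort in JS." }] },
  ],
  tools: [
    {
      name: "Bash", // hypothetical tool name
      description: "Run a shell command",
      input_schema: { type: "object", properties: { command: { type: "string" } } },
    }, // mapped above to an OpenAI function tool
  ],
};
```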

src/utils/index.ts (new file)

@@ -0,0 +1,57 @@
import { HttpsProxyAgent } from "https-proxy-agent";
import OpenAI, { ClientOptions } from "openai";
import fs from "node:fs/promises";
import {
CONFIG_FILE,
DEFAULT_CONFIG,
HOME_DIR,
PROMPTS_DIR,
} from "../constants";
export function getOpenAICommonOptions(): ClientOptions {
const options: ClientOptions = {};
if (process.env.PROXY_URL) {
options.httpAgent = new HttpsProxyAgent(process.env.PROXY_URL);
}
return options;
}
const ensureDir = async (dir_path: string) => {
try {
await fs.access(dir_path);
} catch {
await fs.mkdir(dir_path, { recursive: true });
}
};
export const initDir = async () => {
await ensureDir(HOME_DIR);
await ensureDir(PROMPTS_DIR);
};
export const readConfigFile = async () => {
try {
const config = await fs.readFile(CONFIG_FILE, "utf-8");
return JSON.parse(config);
} catch {
await writeConfigFile(DEFAULT_CONFIG);
return DEFAULT_CONFIG;
}
};
export const writeConfigFile = async (config: any) => {
await fs.writeFile(CONFIG_FILE, JSON.stringify(config, null, 2));
};
export const initConfig = async () => {
const config = await readConfigFile();
Object.assign(process.env, config);
};
export const createClient = (options: ClientOptions) => {
const client = new OpenAI({
...options,
...getOpenAICommonOptions(),
});
return client;
};
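
Because every client is built through createClient, a single PROXY_URL setting (from the shell, or from config.json via initConfig) routes all upstream traffic through one proxy. A small sketch with a placeholder address:

```ts
// Sketch: route every upstream OpenAI-compatible call through one proxy.
process.env.PROXY_URL = "http://127.0.0.1:7890"; // placeholder address
const proxiedClient = createClient({
  apiKey: process.env.CODER_AGENT_API_KEY,
  baseURL: process.env.CODER_AGENT_BASE_URL,
}); // picks up an HttpsProxyAgent via getOpenAICommonOptions()
```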

src/utils/log.ts (new file)

@@ -0,0 +1,27 @@
import fs from 'node:fs';
import path from 'node:path';
import { HOME_DIR } from '../constants';
const LOG_FILE = path.join(HOME_DIR, 'claude-code-router.log');
// Ensure log directory exists
if (!fs.existsSync(HOME_DIR)) {
fs.mkdirSync(HOME_DIR, { recursive: true });
}
export function log(...args: any[]) {
// Check if logging is enabled via environment variable
const isLogEnabled = process.env.LOG === 'true';
if (!isLogEnabled) {
return;
}
const timestamp = new Date().toISOString();
const logMessage = `[${timestamp}] ${args.map(arg =>
typeof arg === 'object' ? JSON.stringify(arg) : String(arg)
).join(' ')}\n`;
// Append to log file
fs.appendFileSync(LOG_FILE, logMessage, 'utf8');
}
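
Logging is opt-in: log() is a no-op unless the LOG environment variable is the string "true". A quick sketch (the output line is illustrative):

```ts
// Sketch: enable logging, then append one timestamped line to
// ~/.claude-code-router/claude-code-router.log.
process.env.LOG = "true";
log("routing request", { model: "deepseek-chat", stream: true });
// -> [2025-03-25T06:51:28.000Z] routing request {"model":"deepseek-chat","stream":true}
```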

src/utils/stream.ts (new file)

@@ -0,0 +1,268 @@
import { Response } from "express";
import { OpenAI } from "openai";
interface ContentBlock {
type: string;
id?: string;
name?: string;
input?: any;
text?: string;
}
interface MessageEvent {
type: string;
message?: {
id: string;
type: string;
role: string;
content: any[];
model: string;
stop_reason: string | null;
stop_sequence: string | null;
usage: {
input_tokens: number;
output_tokens: number;
};
};
delta?: {
stop_reason?: string;
stop_sequence?: string | null;
content?: ContentBlock[];
type?: string;
text?: string;
partial_json?: string;
};
index?: number;
content_block?: ContentBlock;
usage?: {
input_tokens: number;
output_tokens: number;
};
}
export async function streamOpenAIResponse(
res: Response,
completion: AsyncIterable<OpenAI.Chat.Completions.ChatCompletionChunk>,
model: string
) {
const messageId = "msg_" + Date.now();
let contentBlockIndex = 0;
let currentContentBlocks: ContentBlock[] = [];
// Send message_start event
const messageStart: MessageEvent = {
type: "message_start",
message: {
id: messageId,
type: "message",
role: "assistant",
content: [],
model,
stop_reason: null,
stop_sequence: null,
usage: { input_tokens: 1, output_tokens: 1 },
},
};
res.write(`event: message_start\ndata: ${JSON.stringify(messageStart)}\n\n`);
let isToolUse = false;
let toolUseJson = "";
let hasStartedTextBlock = false;
try {
for await (const chunk of completion) {
const delta = chunk.choices[0].delta;
if (delta.tool_calls && delta.tool_calls.length > 0) {
const toolCall = delta.tool_calls[0];
if (!isToolUse) {
// Start new tool call block
isToolUse = true;
const toolBlock: ContentBlock = {
type: "tool_use",
id: `toolu_${Date.now()}`,
name: toolCall.function?.name,
input: {},
};
const toolBlockStart: MessageEvent = {
type: "content_block_start",
index: contentBlockIndex,
content_block: toolBlock,
};
currentContentBlocks.push(toolBlock);
res.write(
`event: content_block_start\ndata: ${JSON.stringify(
toolBlockStart
)}\n\n`
);
toolUseJson = "";
}
// Stream tool call JSON
if (toolCall.function?.arguments) {
const jsonDelta: MessageEvent = {
type: "content_block_delta",
index: contentBlockIndex,
delta: {
type: "input_json_delta",
partial_json: toolCall.function?.arguments,
},
};
toolUseJson += toolCall.function.arguments;
try {
const parsedJson = JSON.parse(toolUseJson);
currentContentBlocks[contentBlockIndex].input = parsedJson;
} catch (e) {
// JSON not yet complete, continue accumulating
}
res.write(
`event: content_block_delta\ndata: ${JSON.stringify(jsonDelta)}\n\n`
);
}
} else if (delta.content) {
// Handle regular text content
if (isToolUse) {
// End previous tool call block
const contentBlockStop: MessageEvent = {
type: "content_block_stop",
index: contentBlockIndex,
};
res.write(
`event: content_block_stop\ndata: ${JSON.stringify(
contentBlockStop
)}\n\n`
);
contentBlockIndex++;
isToolUse = false;
}
if (!delta.content) continue;
// If text block not yet started, send content_block_start
if (!hasStartedTextBlock) {
const textBlock: ContentBlock = {
type: "text",
text: "",
};
const textBlockStart: MessageEvent = {
type: "content_block_start",
index: contentBlockIndex,
content_block: textBlock,
};
currentContentBlocks.push(textBlock);
res.write(
`event: content_block_start\ndata: ${JSON.stringify(
textBlockStart
)}\n\n`
);
hasStartedTextBlock = true;
}
// Send regular text content
const contentDelta: MessageEvent = {
type: "content_block_delta",
index: contentBlockIndex,
delta: {
type: "text_delta",
text: delta.content,
},
};
// Update content block text
if (currentContentBlocks[contentBlockIndex]) {
currentContentBlocks[contentBlockIndex].text += delta.content;
}
res.write(
`event: content_block_delta\ndata: ${JSON.stringify(
contentDelta
)}\n\n`
);
}
}
} catch (e: any) {
// If text block not yet started, send content_block_start
if (!hasStartedTextBlock) {
const textBlock: ContentBlock = {
type: "text",
text: "",
};
const textBlockStart: MessageEvent = {
type: "content_block_start",
index: contentBlockIndex,
content_block: textBlock,
};
currentContentBlocks.push(textBlock);
res.write(
`event: content_block_start\ndata: ${JSON.stringify(
textBlockStart
)}\n\n`
);
hasStartedTextBlock = true;
}
// Send regular text content
const contentDelta: MessageEvent = {
type: "content_block_delta",
index: contentBlockIndex,
delta: {
type: "text_delta",
text: JSON.stringify(e),
},
};
// Update content block text
if (currentContentBlocks[contentBlockIndex]) {
currentContentBlocks[contentBlockIndex].text += JSON.stringify(e);
}
res.write(
`event: content_block_delta\ndata: ${JSON.stringify(contentDelta)}\n\n`
);
}
// Close last content block
const contentBlockStop: MessageEvent = {
type: "content_block_stop",
index: contentBlockIndex,
};
res.write(
`event: content_block_stop\ndata: ${JSON.stringify(contentBlockStop)}\n\n`
);
// Send message_delta event with appropriate stop_reason
const messageDelta: MessageEvent = {
type: "message_delta",
delta: {
stop_reason: isToolUse ? "tool_use" : "end_turn",
stop_sequence: null,
content: currentContentBlocks,
},
usage: { input_tokens: 100, output_tokens: 150 },
};
res.write(`event: message_delta\ndata: ${JSON.stringify(messageDelta)}\n\n`);
// Send message_stop event
const messageStop: MessageEvent = {
type: "message_stop",
};
res.write(`event: message_stop\ndata: ${JSON.stringify(messageStop)}\n\n`);
res.end();
}
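
streamOpenAIResponse translates an OpenAI chunk stream into Anthropic's SSE event sequence: message_start, then content_block_start/delta/stop per block, then message_delta and message_stop. Since it only needs an async iterable, it can be exercised with a fake stream; a minimal sketch, not part of this commit:

```ts
// Sketch: feed streamOpenAIResponse a hand-rolled chunk stream to observe
// the Anthropic-style SSE events it writes (fake data).
async function* fakeCompletion() {
  yield { choices: [{ delta: { content: "Hello" } }] } as any;
  yield { choices: [{ delta: { content: ", world" } }] } as any;
}
// Given an Express `res`, streamOpenAIResponse(res, fakeCompletion(), "deepseek-chat")
// emits: message_start, content_block_start, two text content_block_delta
// events, content_block_stop, a message_delta with stop_reason "end_turn",
// and message_stop.
```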

tsconfig.json (new file)

@@ -0,0 +1,20 @@
{
"compilerOptions": {
"target": "ES2022",
"module": "CommonJS",
"outDir": "./dist",
"rootDir": "./src",
"strict": true,
"esModuleInterop": true,
"skipLibCheck": true,
"forceConsistentCasingInFileNames": true,
"resolveJsonModule": true,
"moduleResolution": "node",
"noImplicitAny": true,
"allowSyntheticDefaultImports": true,
"sourceMap": true,
"declaration": true
},
"include": ["src/**/*.ts"],
"exclude": ["node_modules", "dist"]
}

utils.mjs

@@ -1,9 +0,0 @@
import { HttpsProxyAgent } from "https-proxy-agent";
export function getOpenAICommonOptions() {
const options = {};
if (process.env.PROXY_URL) {
options.httpAgent = new HttpsProxyAgent(process.env.PROXY_URL);
}
return options;
}