Compare commits
5 Commits
6bcdbc2560
...
master
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
9b0c32b6f2 | ||
|
|
03e216373f | ||
|
|
912b027864 | ||
|
|
fa419ccac4 | ||
|
|
cecfc74a96 |
3
.gitignore
vendored
3
.gitignore
vendored
@@ -133,3 +133,6 @@ dmypy.json
|
||||
|
||||
# Cython debug symbols
|
||||
cython_debug/
|
||||
|
||||
# logs
|
||||
logs/
|
||||
|
||||
11
Dockerfile
Normal file
11
Dockerfile
Normal file
@@ -0,0 +1,11 @@
|
||||
# Lightweight Python base image pulled through a registry mirror.
FROM hub.rat.dev/library/python:3.10-alpine

WORKDIR /app

# Copy only the dependency list first so the install layer is cached
# across source-code changes.
COPY requirements.txt .

# Install from the Tsinghua PyPI mirror (faster from within China).
RUN pip install --no-cache-dir -i https://pypi.tuna.tsinghua.edu.cn/simple -r requirements.txt

COPY . .

# Serve the FastAPI app defined in app/ghcproxy.py.
CMD ["uvicorn", "app.ghcproxy:app", "--host", "0.0.0.0", "--port", "8000"]
|
||||
285
app/ghcproxy.py
Normal file
285
app/ghcproxy.py
Normal file
@@ -0,0 +1,285 @@
|
||||
import os
|
||||
import json
|
||||
import random
|
||||
import time
|
||||
from typing import Optional, Dict, Any
|
||||
from datetime import datetime
|
||||
|
||||
import httpx
|
||||
from fastapi import FastAPI, Request, HTTPException
|
||||
from fastapi.responses import StreamingResponse, JSONResponse
|
||||
import uvicorn
|
||||
|
||||
# FastAPI application instance for the Copilot proxy.
app = FastAPI()

# Refresh the Copilot token this many seconds before its reported expiry.
TOKEN_EXPIRY_THRESHOLD = 60
# GitHub OAuth user token used to mint short-lived Copilot session tokens.
# NOTE: hard-coding a credential is a security risk — load it from an
# environment variable or secret store instead.
GITHUB_TOKEN = "ghu_kpJkheogXW18PMY0Eu6D0sL4r5bDsD3aS3EA"
# Endpoint that exchanges the GitHub token for a Copilot session token.
GITHUB_API_URL = "https://api.github.com/copilot_internal/v2/token"

# Process-wide cache of the last token payload returned by GITHUB_API_URL;
# None until the first successful fetch.
cached_token: Optional[Dict[str, Any]] = None
||||
def generate_uuid() -> str:
    """Generate a random RFC 4122 version-4 UUID string.

    Template characters: 'x' becomes a random hex digit, 'y' becomes one
    of '89ab' (the UUID variant nibble); every other character (the '-'
    separators and the literal version digit '4') is kept as-is.
    """
    template = 'xxxxxxxx-xxxx-4xxx-yxxx-xxxxxxxxxxxx'

    # Bug fix: the previous implementation replaced *every* non-'x'
    # character (including '-' and '4') with a random '89ab' digit, so
    # the result was not a valid UUID at all.
    def _fill(c: str) -> str:
        if c == 'x':
            return random.choice('0123456789abcdef')
        if c == 'y':
            return random.choice('89ab')
        return c

    return ''.join(_fill(c) for c in template)
|
||||
|
||||
def is_token_valid(token_data: Optional[Dict[str, Any]]) -> bool:
    """Return True when *token_data* holds a token that is still usable.

    A payload is usable only if it carries both 'token' and 'expires_at'
    and will not expire within the next TOKEN_EXPIRY_THRESHOLD seconds.
    """
    if not token_data:
        return False
    if 'token' not in token_data or 'expires_at' not in token_data:
        return False

    # Treat the token as expired slightly early so in-flight requests
    # never race the real expiry.
    remaining = token_data['expires_at'] - int(time.time())
    return remaining > TOKEN_EXPIRY_THRESHOLD
|
||||
|
||||
async def get_copilot_token() -> Dict[str, Any]:
    """Fetch (or reuse) a short-lived Copilot session token.

    Returns the cached payload while it is still valid; otherwise calls
    GITHUB_API_URL with the configured GITHUB_TOKEN. On any failure a
    stale cached payload (if one exists) is returned as a best-effort
    fallback before an HTTPException is raised.
    """
    global cached_token

    if cached_token and is_token_valid(cached_token):
        return cached_token

    request_headers = {
        "Authorization": f"Bearer {GITHUB_TOKEN}",
        "Editor-Version": "JetBrains-IU/252.26830.84",
        "Editor-Plugin-Version": "copilot-intellij/1.5.58-243",
        "Copilot-Language-Server-Version": "1.382.0",
        "X-Github-Api-Version": "2024-12-15",
        "User-Agent": "GithubCopilot/1.382.0",
        "Accept": "*/*",
    }

    async with httpx.AsyncClient() as client:
        try:
            response = await client.get(GITHUB_API_URL, headers=request_headers, timeout=10.0)
        except httpx.RequestError as e:
            # Network-level failure: prefer serving a stale token over failing hard.
            if cached_token:
                return cached_token
            raise HTTPException(status_code=500, detail=f"Request failed: {str(e)}")

        if response.status_code != 200:
            # Upstream rejected the exchange: fall back to any stale token.
            if cached_token:
                return cached_token
            raise HTTPException(status_code=response.status_code, detail=f"Failed to get token: {response.text}")

        payload = response.json()
        cached_token = payload

        # Seconds until the token must be refreshed (with safety margin).
        remaining = payload['expires_at'] - int(time.time()) - TOKEN_EXPIRY_THRESHOLD
        if remaining > 0:
            print(f"Token cached, will expire in {remaining} seconds")
        else:
            print("Warning: New token has short validity period")

        return payload
|
||||
|
||||
def get_headers_for_path(path: str) -> Dict[str, str]:
    """Build the upstream Copilot request headers for a given API path.

    "/agents" and "/models" get the base editor-identification headers;
    "/chat/completions" additionally gets per-request interaction/request
    IDs and conversation-panel metadata. Any other path falls back to the
    base headers.

    Bug fix: previously the function implicitly returned None for paths
    other than the three listed above, which made the caller crash with
    a TypeError when it tried to add the Authorization header.
    """
    headers = {
        "Editor-Version": "JetBrains-IU/252.26830.84",
        "Editor-Plugin-Version": "copilot-intellij/1.5.58-243",
        "Copilot-Language-Server-Version": "1.382.0",
        "X-Github-Api-Version": "2025-05-01",
        "Copilot-Integration-Id": "jetbrains-chat",
        "User-Agent": "GithubCopilot/1.382.0",
    }

    if path == "/chat/completions":
        # Fresh IDs per request so upstream can correlate the conversation.
        interaction_id = generate_uuid()
        request_id = generate_uuid()

        headers.update({
            "X-Initiator": "user",
            "X-Interaction-Id": interaction_id,
            "X-Interaction-Type": "conversation-panel",
            "Openai-Organization": "github-copilot",
            "X-Request-Id": request_id,
            "Vscode-Sessionid": "427689f2-5dad-4b50-95d9-7cca977450061761839746260",
            "Vscode-Machineid": "c9421c6ac240db1c5bc5117218aa21a73f3762bda7db1702d003ec2df103b812",
            "Openai-Intent": "conversation-panel",
            "Copilot-Vision-Request": "true",
        })

        print(f"/chat/completions path matched, Interaction-Id: {interaction_id}, Request-Id: {request_id}")

    # Base headers for /agents, /models and any other path.
    return headers
|
||||
|
||||
def has_non_empty_content(msg):
    """Return True when the message's 'content' field is meaningfully non-empty."""
    content = msg.get('content')
    if isinstance(content, str):
        # Whitespace-only strings count as empty.
        return bool(content.strip())
    if isinstance(content, (list, dict)):
        # Containers count as non-empty when they hold at least one item.
        return bool(content)
    # Any other non-None value (numbers, booleans, ...) counts as non-empty.
    return content is not None
|
||||
|
||||
def filter_messages_logic(messages):
    """
    Filtering logic:
    find a message A whose role is "assistant" and which carries
    tool_calls, and the next following message B whose role is "tool".
    Delete every message between A and B whose content is non-empty.

    Mutates *messages* in place; returns None.
    """
    if not messages or len(messages) < 3:  # need at least assistant, something, tool
        return

    i = 0
    while i < len(messages):
        current_msg = messages[i]

        # Is the current message an assistant message with a non-empty tool_calls list?
        is_assistant_with_tool_calls = (
            current_msg.get("role") == "assistant" and
            isinstance(current_msg.get("tool_calls"), list) and
            len(current_msg["tool_calls"]) > 0
        )

        if is_assistant_with_tool_calls:
            # Scan forward for the first message with role == "tool".
            j = i + 1
            found_tool = False
            indices_to_remove_between = []

            while j < len(messages):
                msg_to_check = messages[j]

                if msg_to_check.get("role") == "tool":
                    found_tool = True
                    break  # stop at the first tool message; delete what came between
                # Message at j sits between the assistant and the tool message;
                # mark it for removal if its content is non-empty.
                if has_non_empty_content(msg_to_check):
                    indices_to_remove_between.append(j)
                j += 1

            if found_tool and indices_to_remove_between:
                # Delete back-to-front so earlier indices stay valid while popping.
                for idx in sorted(indices_to_remove_between, reverse=True):
                    removed_msg = messages.pop(idx)
                    print(f"Removed intermediate message with non-empty content at index {idx}: {removed_msg}")
                # After removal the list shrank; keep i where it is and let the
                # outer loop re-examine the current position on the next pass.
                continue
            else:
                # Either no paired tool message was found, or there was nothing
                # to delete between them — move on to the next message.
                i += 1
        else:
            # Current message doesn't match the pattern; check the next one.
            i += 1
|
||||
|
||||
@app.api_route("/v1/{path:path}", methods=["GET", "POST", "PUT", "DELETE", "PATCH"])
async def proxy_request(request: Request, path: str):
    """Proxy a /v1/* request to the GitHub Copilot business API.

    The request body is logged to a per-request directory, optionally
    rewritten (tool-call message cleanup via filter_messages_logic),
    forwarded upstream with Copilot auth headers, and the upstream
    response is logged and relayed back to the caller.

    Raises:
        HTTPException: 500 when the upstream request fails at the
            network level (other upstream errors are relayed as-is).
    """
    # Create a timestamped directory to hold this request's log files.
    timestamp = datetime.now().strftime("%Y%m%d_%H%M%S_%f")
    log_dir = os.path.join("logs", timestamp)
    os.makedirs(log_dir, exist_ok=True)

    # Record the original request body before any modification.
    original_body = await request.body()
    with open(os.path.join(log_dir, "original_request.txt"), "wb") as f:
        f.write(original_body or b"")

    token_data = await get_copilot_token()
    print(token_data)
    headers = get_headers_for_path(f"/{path}")
    headers["Authorization"] = f"Bearer {token_data['token']}"
    # NOTE(review): debug-looking header left in place — confirm whether the
    # upstream actually depends on it before removing.
    headers["hello"] = "world"

    body = original_body

    # Filter the messages array (tool-call cleanup) when the body is JSON.
    if body:
        try:
            body_data = json.loads(body.decode('utf-8') if isinstance(body, bytes) else body)
            if "messages" in body_data and isinstance(body_data["messages"], list):
                messages = body_data["messages"]
                initial_len = len(messages)
                print(f"Processing messages, initial count: {initial_len}")
                filter_messages_logic(messages)
                final_len = len(messages)
                if initial_len != final_len:
                    body = json.dumps(body_data).encode('utf-8')
                    print(f"Messages filtered from {initial_len} to {final_len}.")
                    # Record the modified request body.
                    with open(os.path.join(log_dir, "modified_request.txt"), "wb") as f:
                        f.write(body or b"")
                else:
                    # Nothing changed: still record the body as modified_request
                    # so every log directory contains the same set of files.
                    with open(os.path.join(log_dir, "modified_request.txt"), "wb") as f:
                        f.write(body or b"")

        except json.JSONDecodeError:
            # Body is not JSON: forward it untouched.
            print("Request body is not valid JSON, skipping message filtering.")
            with open(os.path.join(log_dir, "modified_request.txt"), "wb") as f:
                f.write(body or b"")

    target_url = "https://api.business.githubcopilot.com/" + path

    print(target_url, " ", str(body))

    async with httpx.AsyncClient() as client:
        try:
            response = await client.request(
                method=request.method,
                url=target_url,
                headers=headers,
                content=body if body else None,
                timeout=120.0,
            )

            content = response.content

            # Record the upstream response.
            with open(os.path.join(log_dir, "response.txt"), "wb") as f:
                f.write(content or b"")

            print("content: ", content)
            if response.headers.get("content-type", "").startswith("text/event-stream"):
                # NOTE(review): the body was already fully read via
                # response.content above, so aiter_bytes() replays the
                # buffered bytes rather than live-streaming from upstream.
                return StreamingResponse(
                    response.aiter_bytes(),
                    status_code=response.status_code,
                    headers=dict(response.headers),
                )

            return JSONResponse(
                content=json.loads(content) if content else {},
                status_code=response.status_code,
                headers={k: v for k, v in response.headers.items()
                         if k.lower() not in ['content-length', 'transfer-encoding']}
            )

        except httpx.RequestError as e:
            # Bug fix: the stdlib module is `traceback`; the original
            # `import backtrace` referenced a third-party package that is
            # not installed, so this error path itself raised
            # ModuleNotFoundError instead of reporting the failure.
            import traceback
            traceback.print_exc()
            raise HTTPException(status_code=500, detail=f"Proxy request failed: {str(e)}")
|
||||
|
||||
@app.get("/")
async def root():
    """Landing endpoint identifying the service."""
    payload = {"message": "GitHub Copilot Proxy API"}
    return payload
|
||||
|
||||
# Allow running the proxy directly for development; the Dockerfile starts
# the same app via the uvicorn CLI instead.
if __name__ == "__main__":
    uvicorn.run(app, host="0.0.0.0", port=8000)
|
||||
@@ -105,10 +105,12 @@ async def chat_completions(
|
||||
|
||||
# First, collect all chunks to detect if there are tool calls
|
||||
async for chunk in stream_llm_api(messages_to_llm, settings, log_id):
|
||||
logger.info(f"sse_result: {chunk}")
|
||||
raw_chunks.append(chunk)
|
||||
# Extract content from SSE chunks
|
||||
parsed = _parse_sse_data(chunk)
|
||||
if parsed and parsed.get("type") != "done":
|
||||
logger.info(f"sse_result_data: {parsed}")
|
||||
if parsed and ( parsed.get("type") != "done" or parsed.get("choices").get("finish_reason") == "stop" ):
|
||||
choices = parsed.get("choices")
|
||||
if choices and len(choices) > 0:
|
||||
delta = choices[0].get("delta")
|
||||
|
||||
@@ -125,6 +125,7 @@ class ResponseParser:
|
||||
1. Responses with tool calls (wrapped in tags)
|
||||
2. Regular text responses
|
||||
3. Multiple tool calls in a single response
|
||||
4. Incomplete tool calls (missing closing tag) - fallback parsing
|
||||
|
||||
Args:
|
||||
llm_response: The raw text response from the LLM
|
||||
@@ -152,6 +153,10 @@ class ResponseParser:
|
||||
if matches:
|
||||
return self._parse_tool_call_response(llm_response, matches)
|
||||
else:
|
||||
# Check for incomplete tool call (opening tag without closing tag)
|
||||
if self.tool_call_start_tag in llm_response:
|
||||
logger.warning("Detected incomplete tool call (missing closing tag). Attempting fallback parsing.")
|
||||
return self._parse_incomplete_tool_call(llm_response)
|
||||
return self._parse_text_only_response(llm_response)
|
||||
|
||||
except Exception as e:
|
||||
@@ -217,6 +222,55 @@ class ResponseParser:
|
||||
tool_calls=tool_calls if tool_calls else None
|
||||
)
|
||||
|
||||
def _parse_incomplete_tool_call(self, llm_response: str) -> ResponseMessage:
|
||||
"""
|
||||
Parse a response with an incomplete tool call (missing closing tag).
|
||||
|
||||
This is a fallback method when the LLM doesn't close the tag properly.
|
||||
It attempts to extract the tool call JSON and complete it.
|
||||
|
||||
Args:
|
||||
llm_response: The full LLM response with incomplete tool call
|
||||
|
||||
Returns:
|
||||
ResponseMessage with content and optionally tool_calls
|
||||
"""
|
||||
try:
|
||||
# Find the opening tag
|
||||
start_idx = llm_response.find(self.tool_call_start_tag)
|
||||
if start_idx == -1:
|
||||
return self._parse_text_only_response(llm_response)
|
||||
|
||||
# Extract content before the opening tag
|
||||
content_before = llm_response[:start_idx].strip() if start_idx > 0 else None
|
||||
|
||||
# Extract everything after the opening tag
|
||||
after_tag = llm_response[start_idx + len(self.tool_call_start_tag):]
|
||||
|
||||
# Try to extract valid JSON
|
||||
json_str = self._extract_valid_json(after_tag)
|
||||
if json_str:
|
||||
try:
|
||||
tool_call_data = json.loads(json_str)
|
||||
tool_call = self._create_tool_call(tool_call_data)
|
||||
|
||||
logger.info(f"Successfully parsed incomplete tool call: {tool_call.function.name}")
|
||||
|
||||
return ResponseMessage(
|
||||
content=content_before,
|
||||
tool_calls=[tool_call]
|
||||
)
|
||||
except json.JSONDecodeError as e:
|
||||
logger.warning(f"Failed to parse JSON from incomplete tool call: {e}")
|
||||
|
||||
# If all else fails, return as text
|
||||
logger.warning("Could not salvage incomplete tool call, returning as text")
|
||||
return ResponseMessage(content=llm_response)
|
||||
|
||||
except Exception as e:
|
||||
logger.warning(f"Error in _parse_incomplete_tool_call: {e}")
|
||||
return ResponseMessage(content=llm_response)
|
||||
|
||||
def _parse_text_only_response(self, llm_response: str) -> ResponseMessage:
|
||||
"""
|
||||
Parse a response with no tool calls.
|
||||
|
||||
@@ -117,17 +117,33 @@ def inject_tools_into_prompt(messages: List[ChatMessage], tools: List[Tool]) ->
|
||||
|
||||
tool_prompt = f"""
|
||||
You are a helpful assistant with access to a set of tools.
|
||||
You can call them by emitting a JSON object inside tool call tags.
|
||||
|
||||
IMPORTANT: Use the following format for tool calls:
|
||||
Format: {TOOL_CALL_START_TAG}{{"name": "tool_name", "arguments": {{...}}}}{TOOL_CALL_END_TAG}
|
||||
## TOOL CALL FORMAT (CRITICAL)
|
||||
|
||||
Example: {full_example}
|
||||
When you need to use a tool, you MUST follow this EXACT format:
|
||||
|
||||
Here are the available tools:
|
||||
{TOOL_CALL_START_TAG}{{"name": "tool_name", "arguments": {{...}}}}{TOOL_CALL_END_TAG}
|
||||
|
||||
### IMPORTANT RULES:
|
||||
1. ALWAYS include BOTH the opening tag ({TOOL_CALL_START_TAG}) AND closing tag ({TOOL_CALL_END_TAG})
|
||||
2. The JSON must be valid and properly formatted
|
||||
3. Keep arguments concise to avoid truncation
|
||||
4. Do not include any text between the tags except the JSON
|
||||
|
||||
### Examples:
|
||||
Simple call:
|
||||
{full_example}
|
||||
|
||||
Multiple arguments:
|
||||
{TOOL_CALL_START_TAG}{{"name": "search", "arguments": {{"query": "example", "limit": 5}}}}{TOOL_CALL_END_TAG}
|
||||
|
||||
## AVAILABLE TOOLS:
|
||||
{tool_defs}
|
||||
|
||||
Only use the tools if strictly necessary.
|
||||
## REMEMBER:
|
||||
- If you decide to call a tool, output ONLY the tool call tags (you may add brief text before or after)
|
||||
- ALWAYS close your tags properly with {TOOL_CALL_END_TAG}
|
||||
- Keep your arguments concise and essential
|
||||
"""
|
||||
# Prepend the system prompt with tool definitions
|
||||
return [ChatMessage(role="system", content=tool_prompt)] + messages
|
||||
@@ -150,7 +166,7 @@ async def _raw_stream_from_llm(messages: List[ChatMessage], settings: Settings,
|
||||
Yields raw byte chunks as received.
|
||||
"""
|
||||
headers = { "Authorization": f"Bearer {settings.REAL_LLM_API_KEY}", "Content-Type": "application/json" }
|
||||
payload = { "model": "default-model", "messages": [msg.model_dump() for msg in messages], "stream": True }
|
||||
payload = { "model": "gpt-4.1", "messages": [msg.model_dump() for msg in messages], "stream": True }
|
||||
|
||||
# Log the request payload to the database
|
||||
update_request_log(log_id, llm_request=payload)
|
||||
|
||||
18
docker-compose.yml
Normal file
18
docker-compose.yml
Normal file
@@ -0,0 +1,18 @@
|
||||
version: '3.8'

services:
  # Web UI for browsing the request-log SQLite database.
  sqlite-web:
    image: docker.1ms.run/coleifer/sqlite-web
    volumes:
      - .:/data
    environment:
      SQLITE_DATABASE: llm_proxy.db
    ports:
      - 8580:8080
  # The proxy service itself, built from the local Dockerfile.
  llmproxy:
    build: .
    ports:
      - "8000:8000"
    volumes:
      # Bind-mount the source tree so code changes appear in the container.
      - .:/app
    restart: unless-stopped
|
||||
1139
docs/multi_backend_final_design.md
Normal file
1139
docs/multi_backend_final_design.md
Normal file
File diff suppressed because it is too large
Load Diff
@@ -1,3 +1,4 @@
|
||||
fastapi
|
||||
uvicorn[standard]
|
||||
httpx
|
||||
python-dotenv
|
||||
pydantic
|
||||
requests
|
||||
|
||||
Reference in New Issue
Block a user