feat(copilot-sdk): release v0.1.1 - remove db dependency, add timeout, fix streaming
- Remove database dependency for session management, use chat_id directly
- Add TIMEOUT valve (default 300s)
- Fix streaming issues by handling full message events
- Improve chat_id extraction and tool detection
- Update docs and bump version to 0.1.1
689  plugins/pipes/github-copilot-sdk/github_copilot_sdk.py  (new file)
@@ -0,0 +1,689 @@
"""
title: GitHub Copilot Official SDK Pipe (Dynamic Models)
author: Fu-Jie
author_url: https://github.com/Fu-Jie/awesome-openwebui
funding_url: https://github.com/open-webui
description: Integrate GitHub Copilot SDK. Supports dynamic models, multi-turn conversation, streaming, multimodal input, and infinite sessions (context compaction).
version: 0.1.1
requirements: github-copilot-sdk
"""

import os
import time
import json
import base64
import tempfile
import asyncio
import logging
import shutil
import subprocess
import sys
from typing import Optional, Union, AsyncGenerator, List, Any, Dict
from pydantic import BaseModel, Field
from datetime import datetime, timezone
import contextlib

# Setup logger
logger = logging.getLogger(__name__)

# Global client storage
_SHARED_CLIENT = None
_SHARED_TOKEN = ""
_CLIENT_LOCK = asyncio.Lock()
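# NOTE: the shared-client globals above are not referenced elsewhere in this
# file; they appear to be placeholders for a future client-reuse path (e.g.
# caching one CopilotClient behind _CLIENT_LOCK instead of starting a new
# client per request).
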
class Pipe:
    class Valves(BaseModel):
        GH_TOKEN: str = Field(
            default="",
            description="GitHub Fine-grained Token (requires the 'Copilot Requests' permission)",
        )
        MODEL_ID: str = Field(
            default="claude-sonnet-4.5",
            description="Default Copilot model name (used when dynamic fetching fails)",
        )
        CLI_PATH: str = Field(
            default="/usr/local/bin/copilot",
            description="Path to the Copilot CLI",
        )
        DEBUG: bool = Field(
            default=False,
            description="Enable technical debug logs (connection info, etc.)",
        )
        SHOW_THINKING: bool = Field(
            default=True,
            description="Show the model's reasoning/thinking process",
        )
        EXCLUDE_KEYWORDS: str = Field(
            default="",
            description="Exclude models containing these keywords (comma-separated, e.g.: codex, haiku)",
        )
        WORKSPACE_DIR: str = Field(
            default="",
            description="Restricted workspace directory for file operations. If empty, allows access to the current process directory.",
        )
        INFINITE_SESSION: bool = Field(
            default=True,
            description="Enable Infinite Sessions (automatic context compaction)",
        )
        COMPACTION_THRESHOLD: float = Field(
            default=0.8,
            description="Background compaction threshold (0.0-1.0)",
        )
        BUFFER_THRESHOLD: float = Field(
            default=0.95,
            description="Buffer exhaustion threshold (0.0-1.0)",
        )
        TIMEOUT: int = Field(
            default=300,
            description="Timeout for each stream chunk (seconds)",
        )

    def __init__(self):
        self.type = "pipe"
        self.id = "copilotsdk"
        self.name = "copilotsdk"
        self.valves = self.Valves()
        self.temp_dir = tempfile.mkdtemp(prefix="copilot_images_")
        self.thinking_started = False
        self._model_cache = []  # Model list cache

    def __del__(self):
        try:
            shutil.rmtree(self.temp_dir)
        except Exception:
            pass

    def _emit_debug_log(self, message: str):
        """Print a debug log line if the DEBUG valve is enabled."""
        if self.valves.DEBUG:
            print(f"[Copilot Pipe] {message}")

    def _get_user_context(self):
        """Helper to get user context (placeholder for future use)."""
        return {}

    def _get_chat_context(
        self, body: dict, __metadata__: Optional[dict] = None
    ) -> Dict[str, str]:
        """
        Chat context extraction with layered fallbacks.
        Priority: __metadata__ > body['chat_id'] > body['metadata']['chat_id']
        """
        chat_id = ""
        source = "none"

        # 1. Prioritize __metadata__ (the most reliable source, injected by OpenWebUI)
        if __metadata__ and isinstance(__metadata__, dict):
            chat_id = __metadata__.get("chat_id", "")
            if chat_id:
                source = "__metadata__"

        # 2. Then try the body root
        if not chat_id and isinstance(body, dict):
            chat_id = body.get("chat_id", "")
            if chat_id:
                source = "body_root"

        # 3. Finally try body['metadata']
        if not chat_id and isinstance(body, dict):
            body_metadata = body.get("metadata", {})
            if isinstance(body_metadata, dict):
                chat_id = body_metadata.get("chat_id", "")
                if chat_id:
                    source = "body_metadata"

        # Debug: log where the ID came from
        if chat_id:
            self._emit_debug_log(f"Extracted ChatID: {chat_id} (Source: {source})")
        else:
            # If still not found, log the body keys for troubleshooting
            keys = list(body.keys()) if isinstance(body, dict) else "not a dict"
            self._emit_debug_log(
                f"Warning: Failed to extract ChatID. Body keys: {keys}"
            )

        return {
            "chat_id": str(chat_id).strip(),
        }

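    # For reference, the (assumed) OpenWebUI payload shapes this helper covers:
    #   __metadata__ = {"chat_id": "abc123", ...}
    #   body = {"chat_id": "abc123", "messages": [...]}
    #   body = {"metadata": {"chat_id": "abc123"}, ...}
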
    async def pipes(self) -> List[dict]:
        """Dynamically fetch the model list."""
        # Return the cache if available
        if self._model_cache:
            return self._model_cache

        self._emit_debug_log("Fetching model list dynamically...")
        try:
            self._setup_env()
            if not self.valves.GH_TOKEN:
                return [{"id": f"{self.id}-error", "name": "Error: GH_TOKEN not set"}]

            from copilot import CopilotClient

            client_config = {}
            if os.environ.get("COPILOT_CLI_PATH"):
                client_config["cli_path"] = os.environ["COPILOT_CLI_PATH"]

            client = CopilotClient(client_config)
            try:
                await client.start()
                models = await client.list_models()

                # Rebuild the cache
                self._model_cache = []
                exclude_list = [
                    k.strip().lower()
                    for k in self.valves.EXCLUDE_KEYWORDS.split(",")
                    if k.strip()
                ]

                models_with_info = []
                for m in models:
                    # Compatible with both dict and object access
                    m_id = (
                        m.get("id") if isinstance(m, dict) else getattr(m, "id", str(m))
                    )
                    m_name = (
                        m.get("name")
                        if isinstance(m, dict)
                        else getattr(m, "name", m_id)
                    )
                    m_policy = (
                        m.get("policy")
                        if isinstance(m, dict)
                        else getattr(m, "policy", {})
                    )
                    m_billing = (
                        m.get("billing")
                        if isinstance(m, dict)
                        else getattr(m, "billing", {})
                    )

                    # Check the policy state
                    state = (
                        m_policy.get("state")
                        if isinstance(m_policy, dict)
                        else getattr(m_policy, "state", "enabled")
                    )
                    if state == "disabled":
                        continue

                    # Keyword filtering
                    if any(kw in m_id.lower() for kw in exclude_list):
                        continue

                    # Get the billing multiplier
                    multiplier = (
                        m_billing.get("multiplier", 1)
                        if isinstance(m_billing, dict)
                        else getattr(m_billing, "multiplier", 1)
                    )

                    # Format the display name
                    if multiplier == 0:
                        display_name = f"-🔥 {m_id} (unlimited)"
                    else:
                        display_name = f"-{m_id} ({multiplier}x)"

                    models_with_info.append(
                        {
                            "id": f"{self.id}-{m_id}",
                            "name": display_name,
                            "multiplier": multiplier,
                            "raw_id": m_id,
                        }
                    )

                # Sort: multiplier ascending, then raw_id ascending
                models_with_info.sort(key=lambda x: (x["multiplier"], x["raw_id"]))
                self._model_cache = [
                    {"id": m["id"], "name": m["name"]} for m in models_with_info
                ]

                self._emit_debug_log(
                    f"Successfully fetched {len(self._model_cache)} models (filtered)"
                )
                return self._model_cache
            except Exception as e:
                self._emit_debug_log(f"Failed to fetch model list: {e}")
                # Fall back to the default model on failure
                return [
                    {
                        "id": f"{self.id}-{self.valves.MODEL_ID}",
                        "name": f"GitHub Copilot ({self.valves.MODEL_ID})",
                    }
                ]
            finally:
                await client.stop()
        except Exception as e:
            self._emit_debug_log(f"Pipes Error: {e}")
            return [
                {
                    "id": f"{self.id}-{self.valves.MODEL_ID}",
                    "name": f"GitHub Copilot ({self.valves.MODEL_ID})",
                }
            ]

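    # Models are surfaced to OpenWebUI as entries like
    # {"id": "copilotsdk-gpt-4o", "name": "-gpt-4o (1x)"}; the "{self.id}-"
    # prefix is stripped again in pipe() to recover the real model id.
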
    async def _get_client(self):
        """Helper to create and start a CopilotClient instance."""
        from copilot import CopilotClient

        client_config = {}
        if os.environ.get("COPILOT_CLI_PATH"):
            client_config["cli_path"] = os.environ["COPILOT_CLI_PATH"]

        client = CopilotClient(client_config)
        await client.start()
        return client

    def _setup_env(self):
        """Locate (or install) the Copilot CLI and export auth env vars."""
        cli_path = self.valves.CLI_PATH
        found = False

        if os.path.exists(cli_path):
            found = True

        if not found:
            sys_path = shutil.which("copilot")
            if sys_path:
                cli_path = sys_path
                found = True

        if not found:
            try:
                subprocess.run(
                    "curl -fsSL https://gh.io/copilot-install | bash",
                    shell=True,
                    check=True,
                )
                if os.path.exists(self.valves.CLI_PATH):
                    cli_path = self.valves.CLI_PATH
                    found = True
            except Exception:
                pass

        if found:
            os.environ["COPILOT_CLI_PATH"] = cli_path
            cli_dir = os.path.dirname(cli_path)
            if cli_dir not in os.environ["PATH"]:
                os.environ["PATH"] = f"{cli_dir}:{os.environ['PATH']}"

        if self.valves.GH_TOKEN:
            os.environ["GH_TOKEN"] = self.valves.GH_TOKEN
            os.environ["GITHUB_TOKEN"] = self.valves.GH_TOKEN

    def _process_images(self, messages):
        attachments = []
        text_content = ""
        if not messages:
            return "", []
        last_msg = messages[-1]
        content = last_msg.get("content", "")

        if isinstance(content, list):
            for item in content:
                if item.get("type") == "text":
                    text_content += item.get("text", "")
                elif item.get("type") == "image_url":
                    image_url = item.get("image_url", {}).get("url", "")
                    if image_url.startswith("data:image"):
                        try:
                            header, encoded = image_url.split(",", 1)
                            ext = header.split(";")[0].split("/")[-1]
                            file_name = f"image_{len(attachments)}.{ext}"
                            file_path = os.path.join(self.temp_dir, file_name)
                            with open(file_path, "wb") as f:
                                f.write(base64.b64decode(encoded))
                            attachments.append(
                                {
                                    "type": "file",
                                    "path": file_path,
                                    "display_name": file_name,
                                }
                            )
                            self._emit_debug_log(f"Image processed: {file_path}")
                        except Exception as e:
                            self._emit_debug_log(f"Image error: {e}")
        else:
            text_content = str(content)
        return text_content, attachments

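    # The parser above handles OpenAI-style multimodal content in the last
    # message, e.g.:
    #   {"role": "user", "content": [
    #       {"type": "text", "text": "Describe this image"},
    #       {"type": "image_url", "image_url": {"url": "data:image/png;base64,...."}},
    #   ]}
    # Data URLs are decoded into temp files and passed to the SDK as attachments.
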
    async def pipe(
        self, body: dict, __metadata__: Optional[dict] = None
    ) -> Union[str, AsyncGenerator]:
        self._setup_env()
        if not self.valves.GH_TOKEN:
            return "Error: Please configure GH_TOKEN in Valves."

        # Parse the user-selected model
        request_model = body.get("model", "")
        real_model_id = self.valves.MODEL_ID  # Default value

        if request_model.startswith(f"{self.id}-"):
            real_model_id = request_model[len(f"{self.id}-") :]
            self._emit_debug_log(f"Using selected model: {real_model_id}")

        messages = body.get("messages", [])
        if not messages:
            return "No messages."

        # Get the Chat ID using the extraction helper
        chat_ctx = self._get_chat_context(body, __metadata__)
        chat_id = chat_ctx.get("chat_id")

        is_streaming = body.get("stream", False)
        self._emit_debug_log(f"Request Streaming: {is_streaming}")

        last_text, attachments = self._process_images(messages)

        # Prompt strategy: resume the session if possible, else create a new one.
        # - Resumed session: it already holds the history, so send only the
        #   last message.
        # - New session: send the full conversation history, since the SDK's
        #   create_session does not accept history and session.send appends.
        # Caveat: if the user edits history in OpenWebUI, a resumed session's
        # state goes stale; always sending full history would be more robust.
        prompt = ""
        is_new_session = True

        try:
            client = await self._get_client()
            session = None

            if chat_id:
                try:
                    # Try to resume a session using chat_id as the session_id
                    session = await client.resume_session(chat_id)
                    self._emit_debug_log(f"Resumed session using ChatID: {chat_id}")
                    is_new_session = False
                except Exception:
                    # Resume failed; the session may not exist on disk
                    self._emit_debug_log(
                        f"Session {chat_id} not found or expired, creating new."
                    )
                    session = None

            if session is None:
                # Create a new session
                from copilot.types import SessionConfig, InfiniteSessionConfig

                # Infinite Session config
                infinite_session_config = None
                if self.valves.INFINITE_SESSION:
                    infinite_session_config = InfiniteSessionConfig(
                        enabled=True,
                        background_compaction_threshold=self.valves.COMPACTION_THRESHOLD,
                        buffer_exhaustion_threshold=self.valves.BUFFER_THRESHOLD,
                    )

                session_config = SessionConfig(
                    session_id=(
                        chat_id if chat_id else None
                    ),  # Use chat_id as the session_id
                    model=real_model_id,
                    streaming=is_streaming,
                    infinite_sessions=infinite_session_config,
                )

                session = await client.create_session(config=session_config)

                new_sid = getattr(session, "session_id", getattr(session, "id", None))
                self._emit_debug_log(f"Created new session: {new_sid}")

        # Construct the prompt
            if is_new_session:
                # For a new session, send the full conversation history
                full_conversation = []
                for msg in messages[:-1]:
                    role = msg.get("role", "user").upper()
                    content = msg.get("content", "")
                    if isinstance(content, list):
                        content = " ".join(
                            [
                                c.get("text", "")
                                for c in content
                                if c.get("type") == "text"
                            ]
                        )
                    full_conversation.append(f"{role}: {content}")
                full_conversation.append(f"USER: {last_text}")
                prompt = "\n\n".join(full_conversation)
            else:
                # For a resumed session, send only the last message
                prompt = last_text

            send_payload = {"prompt": prompt, "mode": "immediate"}
            if attachments:
                send_payload["attachments"] = attachments

            if is_streaming:
                # Determine the session status message for the UI
                init_msg = ""
                if self.valves.DEBUG:
                    if is_new_session:
                        new_sid = getattr(
                            session, "session_id", getattr(session, "id", "unknown")
                        )
                        init_msg = f"> [Debug] Created new session: {new_sid}\n"
                    else:
                        init_msg = (
                            f"> [Debug] Resumed session using ChatID: {chat_id}\n"
                        )

                return self.stream_response(client, session, send_payload, init_msg)
            else:
                try:
                    response = await session.send_and_wait(send_payload)
                    return response.data.content if response else "Empty response."
                finally:
                    # Destroy the session object to free memory, but KEEP its
                    # data on disk so it can be resumed later
                    await session.destroy()

        except Exception as e:
            self._emit_debug_log(f"Request Error: {e}")
            return f"Error: {str(e)}"

    async def stream_response(
        self, client, session, send_payload, init_message: str = ""
    ) -> AsyncGenerator:
        queue = asyncio.Queue()
        done = asyncio.Event()
        self.thinking_started = False
        has_content = False  # Track if any content has been yielded

        def get_event_data(event, attr, default=""):
            """Read `attr` from event.data, tolerating dict vs. object payloads
            and camelCase vs. snake_case field naming."""
            import re

            if hasattr(event, "data"):
                data = event.data
                if data is None:
                    return default
                if isinstance(data, (str, int, float, bool)):
                    return str(data) if attr == "value" else default

                if isinstance(data, dict):
                    val = data.get(attr)
                    if val is None:
                        # Try the name with underscores stripped
                        # (e.g. "delta_content" -> "deltacontent")
                        alt_attr = attr.replace("_", "") if "_" in attr else attr
                        val = data.get(alt_attr)
                        if val is None and "_" not in attr:
                            # Try snake_case if camelCase failed
                            # (e.g. "deltaContent" -> "delta_content")
                            snake_attr = re.sub(r"(?<!^)(?=[A-Z])", "_", attr).lower()
                            val = data.get(snake_attr)
                else:
                    val = getattr(data, attr, None)
                    if val is None:
                        alt_attr = attr.replace("_", "") if "_" in attr else attr
                        val = getattr(data, alt_attr, None)
                        if val is None and "_" not in attr:
                            snake_attr = re.sub(r"(?<!^)(?=[A-Z])", "_", attr).lower()
                            val = getattr(data, snake_attr, None)

                return val if val is not None else default
            return default

        def handler(event):
            # Normalize the event type: it may be an enum (with .value) or a
            # plain string, and `event.type` may be missing entirely
            raw_type = getattr(event, "type", "")
            event_type = getattr(raw_type, "value", None) or str(raw_type)

            # Log full event data for tool events to help debugging
            if "tool" in event_type:
                try:
                    data_str = str(event.data) if hasattr(event, "data") else "no data"
                    self._emit_debug_log(f"Tool Event [{event_type}]: {data_str}")
                except Exception:
                    pass

            self._emit_debug_log(f"Event: {event_type}")

            # Handle message content (delta or full)
            if event_type in [
                "assistant.message_delta",
                "assistant.message.delta",
                "assistant.message",
            ]:
                # Log full message events to help troubleshoot missing deltas
                if event_type == "assistant.message":
                    self._emit_debug_log(
                        f"Received full message event (non-delta): {str(get_event_data(event, 'content'))[:50]}..."
                    )

                delta = (
                    get_event_data(event, "delta_content")
                    or get_event_data(event, "deltaContent")
                    or get_event_data(event, "content")
                    or get_event_data(event, "text")
                )
                if delta:
                    if self.thinking_started:
                        queue.put_nowait("\n</think>\n")
                        self.thinking_started = False
                    queue.put_nowait(delta)

            elif event_type in [
                "assistant.reasoning_delta",
                "assistant.reasoning.delta",
                "assistant.reasoning",
            ]:
                delta = (
                    get_event_data(event, "delta_content")
                    or get_event_data(event, "deltaContent")
                    or get_event_data(event, "content")
                    or get_event_data(event, "text")
                )
                if delta:
                    if not self.thinking_started and self.valves.SHOW_THINKING:
                        queue.put_nowait("<think>\n")
                        self.thinking_started = True
                    if self.thinking_started:
                        queue.put_nowait(delta)

            elif event_type == "tool.execution_start":
                # Try multiple possible fields for the tool name/description
                tool_name = (
                    get_event_data(event, "toolName")
                    or get_event_data(event, "name")
                    or get_event_data(event, "description")
                    or get_event_data(event, "tool_name")
                    or "Unknown Tool"
                )
                if not self.thinking_started and self.valves.SHOW_THINKING:
                    queue.put_nowait("<think>\n")
                    self.thinking_started = True
                if self.thinking_started:
                    queue.put_nowait(f"\nRunning Tool: {tool_name}...\n")
                self._emit_debug_log(f"Tool Start: {tool_name}")

            elif event_type == "tool.execution_complete":
                if self.thinking_started:
                    queue.put_nowait("Tool Completed.\n")
                self._emit_debug_log("Tool Complete")

            elif event_type == "session.compaction_start":
                self._emit_debug_log("Session Compaction Started")

            elif event_type == "session.compaction_complete":
                self._emit_debug_log("Session Compaction Completed")

            elif event_type == "session.idle":
                done.set()
            elif event_type == "session.error":
                msg = get_event_data(event, "message", "Unknown Error")
                queue.put_nowait(f"\n[Error: {msg}]")
                done.set()

        unsubscribe = session.on(handler)
        await session.send(send_payload)

        if self.valves.DEBUG:
            yield "<think>\n"
            if init_message:
                yield init_message
            yield "> [Debug] Connection established, waiting for response...\n"
            self.thinking_started = True

        try:
            while not done.is_set():
                try:
                    chunk = await asyncio.wait_for(
                        queue.get(), timeout=float(self.valves.TIMEOUT)
                    )
                    if chunk:
                        has_content = True
                        yield chunk
                except asyncio.TimeoutError:
                    if done.is_set():
                        break
                    if self.thinking_started:
                        yield f"> [Debug] Waiting for response ({self.valves.TIMEOUT}s exceeded)...\n"
                    continue

            # Drain anything queued between the last get() and done being set
            while not queue.empty():
                chunk = queue.get_nowait()
                if chunk:
                    has_content = True
                    yield chunk

            if self.thinking_started:
                yield "\n</think>\n"
                has_content = True

            # Core fix: if no content was yielded, return a fallback message
            # to prevent an OpenWebUI error on an empty response
            if not has_content:
                yield "⚠️ Copilot returned no content. Please check if the Model ID is correct or enable DEBUG mode in Valves for details."

        except Exception as e:
            yield f"\n[Stream Error: {str(e)}]"
        finally:
            unsubscribe()
            # TODO: proper session cleanup for streaming responses. pipe()
            # returns this generator and exits before the stream finishes, so
            # destruction has to happen here; but without the chat_id we cannot
            # tell whether the session should be kept on disk for later
            # resumption or destroyed. One option is an explicit flag on
            # stream_response (see the sketch below this method).
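
    # Sketch (not wired up) of the flag-based cleanup the TODO above suggests;
    # `destroy_on_finish` is a hypothetical parameter, not part of the current
    # signature:
    #
    #   async def stream_response(self, client, session, send_payload,
    #                             init_message: str = "",
    #                             destroy_on_finish: bool = False):
    #       try:
    #           ...
    #       finally:
    #           unsubscribe()
    #           if destroy_on_finish:
    #               await session.destroy()  # drop sessions with no chat_id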
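
# Rough local-test sketch (assumptions: a valid GitHub token and the OpenWebUI
# call shape shown; OpenWebUI normally drives this class itself):
#
#   import asyncio
#   pipe = Pipe()
#   pipe.valves.GH_TOKEN = "<token>"
#   body = {
#       "model": "copilotsdk-claude-sonnet-4.5",
#       "stream": False,
#       "messages": [{"role": "user", "content": "Hello"}],
#   }
#   print(asyncio.run(pipe.pipe(body, {"chat_id": "local-test"})))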