Spaces:

ricebug
/

glm

Paused

App Files Files Community

glm / main.ts

ricebug

Update main.ts

4dd6468 verified 7 months ago

raw

history blame contribute delete

88.6 kB


	/**
	* ZtoApi - OpenAI兼容API代理服务器
	*
	* 功能概述：
	* - 为 Z.ai 的 GLM-4.5 模型提供 OpenAI 兼容的 API 接口
	* - 支持流式和非流式响应模式
	* - 提供实时监控 Dashboard 功能
	* - 支持匿名 token 自动获取
	* - 智能处理模型思考过程展示
	* - 完整的请求统计和错误处理
	*
	* 技术栈：
	* - Deno 原生 HTTP API
	* - TypeScript 类型安全
	* - Server-Sent Events (SSE) 流式传输
	* - 支持 Deno Deploy 和自托管部署
	*
	* @author ZtoApi Team
	* @version 2.0.0
	* @since 2024
	*/
	declare namespace Deno {
	interface Conn {
	readonly rid: number;
	localAddr: Addr;
	remoteAddr: Addr;
	read(p: Uint8Array): Promise<number \| null>;
	write(p: Uint8Array): Promise<number>;
	close(): void;
	}

	interface Addr {
	hostname: string;
	port: number;
	transport: string;
	}

	interface Listener extends AsyncIterable<Conn> {
	readonly addr: Addr;
	accept(): Promise<Conn>;
	close(): void;
	[Symbol.asyncIterator](): AsyncIterableIterator<Conn>;
	}

	interface HttpConn {
	nextRequest(): Promise<RequestEvent \| null>;
	[Symbol.asyncIterator](): AsyncIterableIterator<RequestEvent>;
	}

	interface RequestEvent {
	request: Request;
	respondWith(r: Response \| Promise<Response>): Promise<void>;
	}

	function listen(options: { port: number }): Listener;
	function serveHttp(conn: Conn): HttpConn;
	function serve(handler: (request: Request) => Promise<Response>): void;

	namespace env {
	function get(key: string): string \| undefined;
	}
	}

	/**
	* 请求统计信息接口
	* 用于跟踪API调用的各项指标
	*/
	interface RequestStats {
	totalRequests: number;
	successfulRequests: number;
	failedRequests: number;
	lastRequestTime: Date;
	averageResponseTime: number;
	}

	/**
	* 实时请求信息接口
	* 用于Dashboard显示最近的API请求记录
	*/
	interface LiveRequest {
	id: string;
	timestamp: Date;
	method: string;
	path: string;
	status: number;
	duration: number;
	userAgent: string;
	model?: string;
	}

	/**
	* OpenAI兼容请求结构
	* 标准的聊天完成API请求格式
	*/
	interface OpenAIRequest {
	model: string;
	messages: Message[];
	stream?: boolean;
	temperature?: number;
	max_tokens?: number;
	}

	/**
	* 聊天消息结构
	* 支持全方位多模态内容：文本、图像、视频、文档
	*/
	interface Message {
	role: string;
	content: string \| Array<{
	type: string;
	text?: string;
	image_url?: {url: string};
	video_url?: {url: string};
	document_url?: {url: string};
	audio_url?: {url: string};
	}>;
	}

	/**
	* 上游服务请求结构
	* 向Z.ai服务发送的请求格式
	*/
	interface UpstreamRequest {
	stream: boolean;
	model: string;
	messages: Message[];
	params: Record<string, unknown>;
	features: Record<string, unknown>;
	background_tasks?: Record<string, boolean>;
	chat_id?: string;
	id?: string;
	mcp_servers?: string[];
	model_item?: {
	id: string;
	name: string;
	owned_by: string;
	openai?: any;
	urlIdx?: number;
	info?: any;
	actions?: any[];
	tags?: any[];
	};
	tool_servers?: string[];
	variables?: Record<string, string>;
	}

	/**
	* OpenAI兼容响应结构
	*/
	interface OpenAIResponse {
	id: string;
	object: string;
	created: number;
	model: string;
	choices: Choice[];
	usage?: Usage;
	}

	interface Choice {
	index: number;
	message?: Message;
	delta?: Delta;
	finish_reason?: string;
	}

	interface Delta {
	role?: string;
	content?: string;
	}

	interface Usage {
	prompt_tokens: number;
	completion_tokens: number;
	total_tokens: number;
	}

	/**
	* 上游SSE数据结构
	*/
	interface UpstreamData {
	type: string;
	data: {
	delta_content: string;
	phase: string;
	done: boolean;
	usage?: Usage;
	error?: UpstreamError;
	inner?: {
	error?: UpstreamError;
	};
	};
	error?: UpstreamError;
	}

	interface UpstreamError {
	detail: string;
	code: number;
	}

	interface ModelsResponse {
	object: string;
	data: Model[];
	}

	interface Model {
	id: string;
	object: string;
	created: number;
	owned_by: string;
	}

	/**
	* 配置常量定义
	*/

	// 思考内容处理策略: strip-去除<details>标签, think-转为<thinking>标签, raw-保留原样
	const THINK_TAGS_MODE = "strip";

	// 伪装前端头部（来自抓包分析）
	const X_FE_VERSION = "prod-fe-1.0.70";
	const BROWSER_UA = "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/139.0.0.0 Safari/537.36 Edg/139.0.0.0";
	const SEC_CH_UA = "\"Not;A=Brand\";v=\"99\", \"Microsoft Edge\";v=\"139\", \"Chromium\";v=\"139\"";
	const SEC_CH_UA_MOB = "?0";
	const SEC_CH_UA_PLAT = "\"Windows\"";
	const ORIGIN_BASE = "https://chat.z.ai";

	const ANON_TOKEN_ENABLED = true;

	/**
	* 环境变量配置
	*/
	const UPSTREAM_URL = Deno.env.get("UPSTREAM_URL") \|\| "https://chat.z.ai/api/chat/completions";
	const DEFAULT_KEY = Deno.env.get("DEFAULT_KEY") \|\| "sk-your-key";
	const ZAI_TOKEN = Deno.env.get("ZAI_TOKEN") \|\| "";

	/**
	* 支持的模型配置
	*/
	interface ModelConfig {
	id: string; // OpenAI API中的模型ID
	name: string; // 显示名称
	upstreamId: string; // Z.ai上游的模型ID
	capabilities: {
	vision: boolean;
	mcp: boolean;
	thinking: boolean;
	};
	defaultParams: {
	top_p: number;
	temperature: number;
	max_tokens?: number;
	};
	}

	const SUPPORTED_MODELS: ModelConfig[] = [
	{
	id: "0727-360B-API",
	name: "GLM-4.5",
	upstreamId: "0727-360B-API",
	capabilities: {
	vision: false,
	mcp: true,
	thinking: true
	},
	defaultParams: {
	top_p: 0.95,
	temperature: 0.6,
	max_tokens: 80000
	}
	},
	{
	id: "glm-4.5v",
	name: "GLM-4.5V",
	upstreamId: "glm-4.5v",
	capabilities: {
	vision: true,
	mcp: false,
	thinking: true
	},
	defaultParams: {
	top_p: 0.6,
	temperature: 0.8
	}
	}
	];

	// 默认模型
	const DEFAULT_MODEL = SUPPORTED_MODELS[0];

	// 根据模型ID获取配置
	function getModelConfig(modelId: string): ModelConfig {
	// 标准化模型ID，处理Cherry Studio等客户端的大小写差异
	const normalizedModelId = normalizeModelId(modelId);
	const found = SUPPORTED_MODELS.find(m => m.id === normalizedModelId);

	if (!found) {
	debugLog("⚠️ 未找到模型配置: %s (标准化后: %s)，使用默认模型: %s",
	modelId, normalizedModelId, DEFAULT_MODEL.name);
	}

	return found \|\| DEFAULT_MODEL;
	}

	/**
	* 标准化模型ID，处理不同客户端的命名差异
	* Cherry Studio等客户端可能使用不同的大小写格式
	*/
	function normalizeModelId(modelId: string): string {
	const normalized = modelId.toLowerCase().trim();

	// 处理常见的模型ID映射
	const modelMappings: Record<string, string> = {
	'glm-4.5v': 'glm-4.5v',
	'glm4.5v': 'glm-4.5v',
	'glm_4.5v': 'glm-4.5v',
	'gpt-4-vision-preview': 'glm-4.5v', // 向后兼容
	'0727-360b-api': '0727-360B-API',
	'glm-4.5': '0727-360B-API',
	'glm4.5': '0727-360B-API',
	'glm_4.5': '0727-360B-API',
	'gpt-4': '0727-360B-API' // 向后兼容
	};

	const mapped = modelMappings[normalized];
	if (mapped) {
	debugLog("🔄 模型ID映射: %s → %s", modelId, mapped);
	return mapped;
	}

	return normalized;
	}

	/**
	* 处理和验证全方位多模态消息
	* 支持图像、视频、文档、音频等多种媒体类型
	*/
	function processMessages(messages: Message[], modelConfig: ModelConfig): Message[] {
	const processedMessages: Message[] = [];

	for (const message of messages) {
	const processedMessage: Message = { ...message };

	// 检查是否为多模态消息
	if (Array.isArray(message.content)) {
	debugLog("检测到多模态消息，内容块数量: %d", message.content.length);

	// 统计各种媒体类型
	const mediaStats = {
	text: 0,
	images: 0,
	videos: 0,
	documents: 0,
	audios: 0,
	others: 0
	};

	// 验证模型是否支持多模态
	if (!modelConfig.capabilities.vision) {
	debugLog("警告: 模型 %s 不支持多模态，但收到了多模态消息", modelConfig.name);
	// 只保留文本内容
	const textContent = message.content
	.filter(block => block.type === 'text')
	.map(block => block.text)
	.join('\n');
	processedMessage.content = textContent;
	} else {
	// GLM-4.5V 支持全方位多模态，处理所有内容类型
	for (const block of message.content) {
	switch (block.type) {
	case 'text':
	if (block.text) {
	mediaStats.text++;
	debugLog("📝 文本内容，长度: %d", block.text.length);
	}
	break;

	case 'image_url':
	if (block.image_url?.url) {
	mediaStats.images++;
	const url = block.image_url.url;
	if (url.startsWith('data:image/')) {
	const mimeMatch = url.match(/data:image\/([^;]+)/);
	const format = mimeMatch ? mimeMatch[1] : 'unknown';
	debugLog("🖼️ 图像数据: %s格式, 大小: %d字符", format, url.length);
	} else if (url.startsWith('http')) {
	debugLog("🔗 图像URL: %s", url);
	} else {
	debugLog("⚠️ 未知图像格式: %s", url.substring(0, 50));
	}
	}
	break;

	case 'video_url':
	if (block.video_url?.url) {
	mediaStats.videos++;
	const url = block.video_url.url;
	if (url.startsWith('data:video/')) {
	const mimeMatch = url.match(/data:video\/([^;]+)/);
	const format = mimeMatch ? mimeMatch[1] : 'unknown';
	debugLog("🎥 视频数据: %s格式, 大小: %d字符", format, url.length);
	} else if (url.startsWith('http')) {
	debugLog("🔗 视频URL: %s", url);
	} else {
	debugLog("⚠️ 未知视频格式: %s", url.substring(0, 50));
	}
	}
	break;

	case 'document_url':
	if (block.document_url?.url) {
	mediaStats.documents++;
	const url = block.document_url.url;
	if (url.startsWith('data:application/')) {
	const mimeMatch = url.match(/data:application\/([^;]+)/);
	const format = mimeMatch ? mimeMatch[1] : 'unknown';
	debugLog("📄 文档数据: %s格式, 大小: %d字符", format, url.length);
	} else if (url.startsWith('http')) {
	debugLog("🔗 文档URL: %s", url);
	} else {
	debugLog("⚠️ 未知文档格式: %s", url.substring(0, 50));
	}
	}
	break;

	case 'audio_url':
	if (block.audio_url?.url) {
	mediaStats.audios++;
	const url = block.audio_url.url;
	if (url.startsWith('data:audio/')) {
	const mimeMatch = url.match(/data:audio\/([^;]+)/);
	const format = mimeMatch ? mimeMatch[1] : 'unknown';
	debugLog("🎵 音频数据: %s格式, 大小: %d字符", format, url.length);
	} else if (url.startsWith('http')) {
	debugLog("🔗 音频URL: %s", url);
	} else {
	debugLog("⚠️ 未知音频格式: %s", url.substring(0, 50));
	}
	}
	break;

	default:
	mediaStats.others++;
	debugLog("❓ 未知内容类型: %s", block.type);
	}
	}

	// 输出统计信息
	const totalMedia = mediaStats.images + mediaStats.videos + mediaStats.documents + mediaStats.audios;
	if (totalMedia > 0) {
	debugLog("🎯 多模态内容统计: 文本(%d) 图像(%d) 视频(%d) 文档(%d) 音频(%d)",
	mediaStats.text, mediaStats.images, mediaStats.videos, mediaStats.documents, mediaStats.audios);
	}
	}
	} else if (typeof message.content === 'string') {
	debugLog("📝 纯文本消息，长度: %d", message.content.length);
	}

	processedMessages.push(processedMessage);
	}

	return processedMessages;
	}

	const DEBUG_MODE = Deno.env.get("DEBUG_MODE") !== "false"; // 默认为true
	const DEFAULT_STREAM = Deno.env.get("DEFAULT_STREAM") !== "false"; // 默认为true
	const DASHBOARD_ENABLED = Deno.env.get("DASHBOARD_ENABLED") !== "false"; // 默认为true

	/**
	* 全局状态变量
	*/

	let stats: RequestStats = {
	totalRequests: 0,
	successfulRequests: 0,
	failedRequests: 0,
	lastRequestTime: new Date(),
	averageResponseTime: 0
	};

	let liveRequests: LiveRequest[] = [];

	/**
	* 工具函数
	*/

	function debugLog(format: string, ...args: unknown[]): void {
	if (DEBUG_MODE) {
	console.log(`[DEBUG] ${format}`, ...args);
	}
	}

	function recordRequestStats(startTime: number, path: string, status: number): void {
	const duration = Date.now() - startTime;

	stats.totalRequests++;
	stats.lastRequestTime = new Date();

	if (status >= 200 && status < 300) {
	stats.successfulRequests++;
	} else {
	stats.failedRequests++;
	}

	// 更新平均响应时间
	if (stats.totalRequests > 0) {
	const totalDuration = stats.averageResponseTime * (stats.totalRequests - 1) + duration;
	stats.averageResponseTime = totalDuration / stats.totalRequests;
	} else {
	stats.averageResponseTime = duration;
	}
	}

	function addLiveRequest(method: string, path: string, status: number, duration: number, userAgent: string, model?: string): void {
	const request: LiveRequest = {
	id: Date.now().toString(),
	timestamp: new Date(),
	method,
	path,
	status,
	duration,
	userAgent,
	model
	};

	liveRequests.push(request);

	// 只保留最近的100条请求
	if (liveRequests.length > 100) {
	liveRequests = liveRequests.slice(1);
	}
	}

	function getLiveRequestsData(): string {
	try {
	// 确保liveRequests是数组
	if (!Array.isArray(liveRequests)) {
	debugLog("liveRequests不是数组，重置为空数组");
	liveRequests = [];
	}

	// 确保返回的数据格式与前端期望的一致
	const requestData = liveRequests.map(req => ({
	id: req.id \|\| "",
	timestamp: req.timestamp \|\| new Date(),
	method: req.method \|\| "",
	path: req.path \|\| "",
	status: req.status \|\| 0,
	duration: req.duration \|\| 0,
	user_agent: req.userAgent \|\| ""
	}));

	return JSON.stringify(requestData);
	} catch (error) {
	debugLog("获取实时请求数据失败: %v", error);
	return JSON.stringify([]);
	}
	}

	function getStatsData(): string {
	try {
	// 确保stats对象存在
	if (!stats) {
	debugLog("stats对象不存在，使用默认值");
	stats = {
	totalRequests: 0,
	successfulRequests: 0,
	failedRequests: 0,
	lastRequestTime: new Date(),
	averageResponseTime: 0
	};
	}

	// 确保返回的数据格式与前端期望的一致
	const statsData = {
	totalRequests: stats.totalRequests \|\| 0,
	successfulRequests: stats.successfulRequests \|\| 0,
	failedRequests: stats.failedRequests \|\| 0,
	averageResponseTime: stats.averageResponseTime \|\| 0
	};

	return JSON.stringify(statsData);
	} catch (error) {
	debugLog("获取统计数据失败: %v", error);
	return JSON.stringify({
	totalRequests: 0,
	successfulRequests: 0,
	failedRequests: 0,
	averageResponseTime: 0
	});
	}
	}

	function getClientIP(request: Request): string {
	// 检查X-Forwarded-For头
	const xff = request.headers.get("X-Forwarded-For");
	if (xff) {
	const ips = xff.split(",");
	if (ips.length > 0) {
	return ips[0].trim();
	}
	}

	// 检查X-Real-IP头
	const xri = request.headers.get("X-Real-IP");
	if (xri) {
	return xri;
	}

	// 对于Deno Deploy，我们无法直接获取RemoteAddr，返回一个默认值
	return "unknown";
	}

	function setCORSHeaders(headers: Headers): void {
	headers.set("Access-Control-Allow-Origin", "*");
	headers.set("Access-Control-Allow-Methods", "GET, POST, PUT, DELETE, OPTIONS");
	headers.set("Access-Control-Allow-Headers", "Content-Type, Authorization");
	headers.set("Access-Control-Allow-Credentials", "true");
	}

	function validateApiKey(authHeader: string \| null): boolean {
	if (!authHeader \|\| !authHeader.startsWith("Bearer ")) {
	return false;
	}

	const apiKey = authHeader.substring(7);
	return apiKey === DEFAULT_KEY;
	}

	async function getAnonymousToken(): Promise<string> {
	try {
	const response = await fetch(`${ORIGIN_BASE}/api/v1/auths/`, {
	method: "GET",
	headers: {
	"User-Agent": BROWSER_UA,
	"Accept": "/",
	"Accept-Language": "zh-CN,zh;q=0.9",
	"X-FE-Version": X_FE_VERSION,
	"sec-ch-ua": SEC_CH_UA,
	"sec-ch-ua-mobile": SEC_CH_UA_MOB,
	"sec-ch-ua-platform": SEC_CH_UA_PLAT,
	"Origin": ORIGIN_BASE,
	"Referer": `${ORIGIN_BASE}/`
	}
	});

	if (!response.ok) {
	throw new Error(`Anonymous token request failed with status ${response.status}`);
	}

	const data = await response.json() as { token: string };
	if (!data.token) {
	throw new Error("Anonymous token is empty");
	}

	return data.token;
	} catch (error) {
	debugLog("获取匿名token失败: %v", error);
	throw error;
	}
	}

	// 调用上游API
	async function callUpstreamWithHeaders(
	upstreamReq: UpstreamRequest,
	refererChatID: string,
	authToken: string
	): Promise<Response> {
	try {
	debugLog("调用上游API: %s", UPSTREAM_URL);

	// 特别检查和记录全方位多模态内容
	const hasMultimedia = upstreamReq.messages.some(msg =>
	Array.isArray(msg.content) &&
	msg.content.some(block =>
	['image_url', 'video_url', 'document_url', 'audio_url'].includes(block.type)
	)
	);

	if (hasMultimedia) {
	debugLog("🎯 请求包含多模态数据，正在发送到上游...");

	for (let i = 0; i < upstreamReq.messages.length; i++) {
	const msg = upstreamReq.messages[i];
	if (Array.isArray(msg.content)) {
	for (let j = 0; j < msg.content.length; j++) {
	const block = msg.content[j];

	// 处理图像
	if (block.type === 'image_url' && block.image_url?.url) {
	const url = block.image_url.url;
	if (url.startsWith('data:image/')) {
	const mimeMatch = url.match(/data:image\/([^;]+)/);
	const format = mimeMatch ? mimeMatch[1] : 'unknown';
	const sizeKB = Math.round(url.length * 0.75 / 1024); // base64 大约是原文件的 1.33 倍
	debugLog("🖼️ 消息[%d] 图像[%d]: %s格式, 数据长度: %d字符 (~%dKB)",
	i, j, format, url.length, sizeKB);

	// 图片大小警告
	if (sizeKB > 1000) {
	debugLog("⚠️ 图片较大 (%dKB)，可能导致上游处理失败", sizeKB);
	debugLog("💡 建议: 将图片压缩到 500KB 以下");
	} else if (sizeKB > 500) {
	debugLog("⚠️ 图片偏大 (%dKB)，建议压缩", sizeKB);
	}
	} else {
	debugLog("🔗 消息[%d] 图像[%d]: 外部URL - %s", i, j, url);
	}
	}

	// 处理视频
	if (block.type === 'video_url' && block.video_url?.url) {
	const url = block.video_url.url;
	if (url.startsWith('data:video/')) {
	const mimeMatch = url.match(/data:video\/([^;]+)/);
	const format = mimeMatch ? mimeMatch[1] : 'unknown';
	debugLog("🎥 消息[%d] 视频[%d]: %s格式, 数据长度: %d字符",
	i, j, format, url.length);
	} else {
	debugLog("🔗 消息[%d] 视频[%d]: 外部URL - %s", i, j, url);
	}
	}

	// 处理文档
	if (block.type === 'document_url' && block.document_url?.url) {
	const url = block.document_url.url;
	if (url.startsWith('data:application/')) {
	const mimeMatch = url.match(/data:application\/([^;]+)/);
	const format = mimeMatch ? mimeMatch[1] : 'unknown';
	debugLog("📄 消息[%d] 文档[%d]: %s格式, 数据长度: %d字符",
	i, j, format, url.length);
	} else {
	debugLog("🔗 消息[%d] 文档[%d]: 外部URL - %s", i, j, url);
	}
	}

	// 处理音频
	if (block.type === 'audio_url' && block.audio_url?.url) {
	const url = block.audio_url.url;
	if (url.startsWith('data:audio/')) {
	const mimeMatch = url.match(/data:audio\/([^;]+)/);
	const format = mimeMatch ? mimeMatch[1] : 'unknown';
	debugLog("🎵 消息[%d] 音频[%d]: %s格式, 数据长度: %d字符",
	i, j, format, url.length);
	} else {
	debugLog("🔗 消息[%d] 音频[%d]: 外部URL - %s", i, j, url);
	}
	}
	}
	}
	}
	}

	debugLog("上游请求体: %s", JSON.stringify(upstreamReq));

	const response = await fetch(UPSTREAM_URL, {
	method: "POST",
	headers: {
	"Content-Type": "application/json",
	"Accept": "application/json, text/event-stream",
	"User-Agent": BROWSER_UA,
	"Authorization": `Bearer ${authToken}`,
	"Accept-Language": "zh-CN",
	"sec-ch-ua": SEC_CH_UA,
	"sec-ch-ua-mobile": SEC_CH_UA_MOB,
	"sec-ch-ua-platform": SEC_CH_UA_PLAT,
	"X-FE-Version": X_FE_VERSION,
	"Origin": ORIGIN_BASE,
	"Referer": `${ORIGIN_BASE}/c/${refererChatID}`
	},
	body: JSON.stringify(upstreamReq)
	});

	debugLog("上游响应状态: %d %s", response.status, response.statusText);
	return response;
	} catch (error) {
	debugLog("调用上游失败: %v", error);
	throw error;
	}
	}

	function transformThinking(content: string): string {
	// 去 <summary>…</summary>
	let result = content.replace(/<summary>.*?<\/summary>/gs, "");
	// 清理残留自定义标签，如 </thinking>、<Full> 等
	result = result.replace(/<\/thinking>/g, "");
	result = result.replace(/<Full>/g, "");
	result = result.replace(/<\/Full>/g, "");
	result = result.trim();

	switch (THINK_TAGS_MODE as "strip" \| "think" \| "raw") {
	case "think":
	result = result.replace(/<details[^>]*>/g, "<thinking>");
	result = result.replace(/<\/details>/g, "</thinking>");
	break;
	case "strip":
	result = result.replace(/<details[^>]*>/g, "");
	result = result.replace(/<\/details>/g, "");
	break;
	}

	// 处理每行前缀 "> "（包括起始位置）
	result = result.replace(/^> /, "");
	result = result.replace(/\n> /g, "\n");
	return result.trim();
	}

	async function processUpstreamStream(
	body: ReadableStream<Uint8Array>,
	writer: WritableStreamDefaultWriter<Uint8Array>,
	encoder: TextEncoder,
	modelName: string
	): Promise<void> {
	const reader = body.getReader();
	const decoder = new TextDecoder();
	let buffer = "";

	try {
	while (true) {
	const { done, value } = await reader.read();
	if (done) break;

	buffer += decoder.decode(value, { stream: true });
	const lines = buffer.split('\n');
	buffer = lines.pop() \|\| ""; // 保留最后一个不完整的行

	for (const line of lines) {
	if (line.startsWith("data: ")) {
	const dataStr = line.substring(6);
	if (dataStr === "") continue;

	debugLog("收到SSE数据: %s", dataStr);

	try {
	const upstreamData = JSON.parse(dataStr) as UpstreamData;

	// 错误检测
	if (upstreamData.error \|\| upstreamData.data.error \|\|
	(upstreamData.data.inner && upstreamData.data.inner.error)) {
	const errObj = upstreamData.error \|\| upstreamData.data.error \|\|
	(upstreamData.data.inner && upstreamData.data.inner.error);
	debugLog("上游错误: code=%d, detail=%s", errObj?.code, errObj?.detail);

	// 分析错误类型，特别是多模态相关错误
	const errorDetail = (errObj?.detail \|\| "").toLowerCase();
	if (errorDetail.includes("something went wrong") \|\| errorDetail.includes("try again later")) {
	debugLog("🚨 Z.ai 服务器错误分析:");
	debugLog(" 📋 错误详情: %s", errObj?.detail);
	debugLog(" 🖼️ 可能原因: 图片处理失败");
	debugLog(" 💡 建议解决方案:");
	debugLog(" 1. 使用更小的图片 (< 500KB)");
	debugLog(" 2. 尝试不同的图片格式 (JPEG 而不是 PNG)");
	debugLog(" 3. 稍后重试 (可能是服务器负载问题)");
	debugLog(" 4. 检查图片是否损坏");
	}

	// 发送结束chunk
	const endChunk: OpenAIResponse = {
	id: `chatcmpl-${Date.now()}`,
	object: "chat.completion.chunk",
	created: Math.floor(Date.now() / 1000),
	model: modelName,
	choices: [
	{
	index: 0,
	delta: {},
	finish_reason: "stop"
	}
	]
	};

	await writer.write(encoder.encode(`data: ${JSON.stringify(endChunk)}\n\n`));
	await writer.write(encoder.encode("data: [DONE]\n\n"));
	return;
	}

	debugLog("解析成功 - 类型: %s, 阶段: %s, 内容长度: %d, 完成: %v",
	upstreamData.type, upstreamData.data.phase,
	upstreamData.data.delta_content ? upstreamData.data.delta_content.length : 0,
	upstreamData.data.done);

	// 处理内容
	if (upstreamData.data.delta_content && upstreamData.data.delta_content !== "") {
	let out = upstreamData.data.delta_content;
	if (upstreamData.data.phase === "thinking") {
	out = transformThinking(out);
	}

	if (out !== "") {
	debugLog("发送内容(%s): %s", upstreamData.data.phase, out);

	const chunk: OpenAIResponse = {
	id: `chatcmpl-${Date.now()}`,
	object: "chat.completion.chunk",
	created: Math.floor(Date.now() / 1000),
	model: modelName,
	choices: [
	{
	index: 0,
	delta: { content: out }
	}
	]
	};

	await writer.write(encoder.encode(`data: ${JSON.stringify(chunk)}\n\n`));
	}
	}

	// 检查是否结束
	if (upstreamData.data.done \|\| upstreamData.data.phase === "done") {
	debugLog("检测到流结束信号");

	// 发送结束chunk
	const endChunk: OpenAIResponse = {
	id: `chatcmpl-${Date.now()}`,
	object: "chat.completion.chunk",
	created: Math.floor(Date.now() / 1000),
	model: modelName,
	choices: [
	{
	index: 0,
	delta: {},
	finish_reason: "stop"
	}
	]
	};

	await writer.write(encoder.encode(`data: ${JSON.stringify(endChunk)}\n\n`));
	await writer.write(encoder.encode("data: [DONE]\n\n"));
	return;
	}
	} catch (error) {
	debugLog("SSE数据解析失败: %v", error);
	}
	}
	}
	}
	} finally {
	writer.close();
	}
	}

	// 收集完整响应（用于非流式响应）
	async function collectFullResponse(body: ReadableStream<Uint8Array>): Promise<string> {
	const reader = body.getReader();
	const decoder = new TextDecoder();
	let buffer = "";
	let fullContent = "";

	try {
	while (true) {
	const { done, value } = await reader.read();
	if (done) break;

	buffer += decoder.decode(value, { stream: true });
	const lines = buffer.split('\n');
	buffer = lines.pop() \|\| ""; // 保留最后一个不完整的行

	for (const line of lines) {
	if (line.startsWith("data: ")) {
	const dataStr = line.substring(6);
	if (dataStr === "") continue;

	try {
	const upstreamData = JSON.parse(dataStr) as UpstreamData;

	if (upstreamData.data.delta_content !== "") {
	let out = upstreamData.data.delta_content;
	if (upstreamData.data.phase === "thinking") {
	out = transformThinking(out);
	}

	if (out !== "") {
	fullContent += out;
	}
	}

	// 检查是否结束
	if (upstreamData.data.done \|\| upstreamData.data.phase === "done") {
	debugLog("检测到完成信号，停止收集");
	return fullContent;
	}
	} catch (error) {
	// 忽略解析错误
	}
	}
	}
	}
	} finally {
	reader.releaseLock();
	}

	return fullContent;
	}

	/**
	* HTTP服务器和路由处理
	*/

	function getIndexHTML(): string {
	return `<!DOCTYPE html>
	<html lang="zh-CN">
	<head>
	<meta charset="UTF-8">
	<meta name="viewport" content="width=device-width, initial-scale=1.0">
	<title>ZtoApi - OpenAI兼容API代理</title>
	<style>
	body {
	font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif;
	margin: 0;
	padding: 0;
	background-color: #f5f5f5;
	line-height: 1.6;
	}
	.container {
	max-width: 1200px;
	margin: 0 auto;
	background-color: white;
	border-radius: 8px;
	box-shadow: 0 2px 10px rgba(0,0,0,0.1);
	padding: 40px;
	margin-top: 40px;
	}
	header {
	text-align: center;
	margin-bottom: 40px;
	}
	h1 {
	color: #333;
	margin-bottom: 10px;
	font-size: 2.5rem;
	}
	.subtitle {
	color: #666;
	font-size: 1.2rem;
	margin-bottom: 30px;
	}
	.links {
	display: grid;
	grid-template-columns: repeat(auto-fit, minmax(300px, 1fr));
	gap: 20px;
	margin-top: 40px;
	}
	.link-card {
	background-color: #f8f9fa;
	border-radius: 8px;
	padding: 20px;
	text-align: center;
	transition: transform 0.3s ease, box-shadow 0.3s ease;
	border: 1px solid #e9ecef;
	}
	.link-card:hover {
	transform: translateY(-5px);
	box-shadow: 0 5px 15px rgba(0,0,0,0.1);
	}
	.link-card h3 {
	margin-top: 0;
	color: #007bff;
	}
	.link-card p {
	color: #666;
	margin-bottom: 20px;
	}
	.link-card a {
	display: inline-block;
	background-color: #007bff;
	color: white;
	padding: 10px 20px;
	border-radius: 4px;
	text-decoration: none;
	font-weight: bold;
	transition: background-color 0.3s ease;
	}
	.link-card a:hover {
	background-color: #0056b3;
	}
	.features {
	margin-top: 60px;
	}
	.features h2 {
	text-align: center;
	color: #333;
	margin-bottom: 30px;
	}
	.feature-list {
	display: grid;
	grid-template-columns: repeat(auto-fit, minmax(250px, 1fr));
	gap: 20px;
	}
	.feature-item {
	text-align: center;
	padding: 20px;
	}
	.feature-item i {
	font-size: 2rem;
	color: #007bff;
	margin-bottom: 15px;
	}
	.feature-item h3 {
	color: #333;
	margin-bottom: 10px;
	}
	.feature-item p {
	color: #666;
	}
	footer {
	text-align: center;
	margin-top: 60px;
	padding-top: 20px;
	border-top: 1px solid #e9ecef;
	color: #666;
	}
	</style>
	</head>
	<body>
	<div class="container">
	<header>
	<h1>ZtoApi</h1>
	<div class="subtitle">OpenAI兼容API代理 for Z.ai GLM-4.5</div>
	<p>一个高性能、易于部署的API代理服务，让你能够使用OpenAI兼容的格式访问Z.ai的GLM-4.5模型。</p>
	</header>

	<div class="links">
	<div class="link-card">
	<h3>📖 API文档</h3>
	<p>查看完整的API文档，了解如何使用本服务。</p>
	<a href="/docs">查看文档</a>
	</div>

	<div class="link-card">
	<h3>📊 API调用看板</h3>
	<p>实时监控API调用情况，查看请求统计和性能指标。</p>
	<a href="/dashboard">查看看板</a>
	</div>

	<div class="link-card">
	<h3>🤖 模型列表</h3>
	<p>查看可用的AI模型列表及其详细信息。</p>
	<a href="/v1/models">查看模型</a>
	</div>
	</div>

	<div class="features">
	<h2>功能特性</h2>
	<div class="feature-list">
	<div class="feature-item">
	<div>🔄</div>
	<h3>OpenAI API兼容</h3>
	<p>完全兼容OpenAI的API格式，无需修改客户端代码</p>
	</div>

	<div class="feature-item">
	<div>🌊</div>
	<h3>流式响应支持</h3>
	<p>支持实时流式输出，提供更好的用户体验</p>
	</div>

	<div class="feature-item">
	<div>🔐</div>
	<h3>身份验证</h3>
	<p>支持API密钥验证，确保服务安全</p>
	</div>

	<div class="feature-item">
	<div>🛠️</div>
	<h3>灵活配置</h3>
	<p>通过环境变量进行灵活配置</p>
	</div>

	<div class="feature-item">
	<div>📝</div>
	<h3>思考过程展示</h3>
	<p>智能处理并展示模型的思考过程</p>
	</div>

	<div class="feature-item">
	<div>📊</div>
	<h3>实时监控</h3>
	<p>提供Web仪表板，实时显示API转发情况和统计信息</p>
	</div>
	</div>
	</div>

	<footer>
	<p>© 2024 ZtoApi. Powered by Deno & Z.ai GLM-4.5</p>
	</footer>
	</div>
	</body>
	</html>`;
	}

	async function handleIndex(request: Request): Promise<Response> {
	if (request.method !== "GET") {
	return new Response("Method not allowed", { status: 405 });
	}

	return new Response(getIndexHTML(), {
	status: 200,
	headers: {
	"Content-Type": "text/html; charset=utf-8"
	}
	});
	}

	async function handleOptions(request: Request): Promise<Response> {
	const headers = new Headers();
	setCORSHeaders(headers);

	if (request.method === "OPTIONS") {
	return new Response(null, { status: 200, headers });
	}

	return new Response("Not Found", { status: 404, headers });
	}

	async function handleModels(request: Request): Promise<Response> {
	const headers = new Headers();
	setCORSHeaders(headers);

	if (request.method === "OPTIONS") {
	return new Response(null, { status: 200, headers });
	}

	// 支持的模型
	const models = SUPPORTED_MODELS.map(model => ({
	id: model.name,
	object: "model",
	created: Math.floor(Date.now() / 1000),
	owned_by: "z.ai"
	}));

	const response: ModelsResponse = {
	object: "list",
	data: models
	};

	headers.set("Content-Type", "application/json");
	return new Response(JSON.stringify(response), {
	status: 200,
	headers
	});
	}

	async function handleChatCompletions(request: Request): Promise<Response> {
	const startTime = Date.now();
	const url = new URL(request.url);
	const path = url.pathname;
	const userAgent = request.headers.get("User-Agent") \|\| "";

	debugLog("收到chat completions请求");
	debugLog("🌐 User-Agent: %s", userAgent);

	// Cherry Studio 检测
	const isCherryStudio = userAgent.toLowerCase().includes('cherry') \|\| userAgent.toLowerCase().includes('studio');
	if (isCherryStudio) {
	debugLog("🍒 检测到 Cherry Studio 客户端版本: %s",
	userAgent.match(/CherryStudio\/([^\s]+)/)?.[1] \|\| 'unknown');
	}

	const headers = new Headers();
	setCORSHeaders(headers);

	if (request.method === "OPTIONS") {
	return new Response(null, { status: 200, headers });
	}

	// 验证API Key
	const authHeader = request.headers.get("Authorization");
	if (!validateApiKey(authHeader)) {
	debugLog("缺少或无效的Authorization头");
	const duration = Date.now() - startTime;
	recordRequestStats(startTime, path, 401);
	addLiveRequest(request.method, path, 401, duration, userAgent);
	return new Response("Missing or invalid Authorization header", {
	status: 401,
	headers
	});
	}

	debugLog("API key验证通过");

	// 读取请求体
	let body: string;
	try {
	body = await request.text();
	debugLog("📥 收到请求体长度: %d 字符", body.length);

	// 为Cherry Studio调试：记录原始请求体（截取前1000字符避免日志过长）
	const bodyPreview = body.length > 1000 ? body.substring(0, 1000) + "..." : body;
	debugLog("📄 请求体预览: %s", bodyPreview);
	} catch (error) {
	debugLog("读取请求体失败: %v", error);
	const duration = Date.now() - startTime;
	recordRequestStats(startTime, path, 400);
	addLiveRequest(request.method, path, 400, duration, userAgent);
	return new Response("Failed to read request body", {
	status: 400,
	headers
	});
	}

	// 解析请求
	let req: OpenAIRequest;
	try {
	req = JSON.parse(body) as OpenAIRequest;
	debugLog("✅ JSON解析成功");
	} catch (error) {
	debugLog("JSON解析失败: %v", error);
	const duration = Date.now() - startTime;
	recordRequestStats(startTime, path, 400);
	addLiveRequest(request.method, path, 400, duration, userAgent);
	return new Response("Invalid JSON", {
	status: 400,
	headers
	});
	}

	// 如果客户端没有明确指定stream参数，使用默认值
	if (!body.includes('"stream"')) {
	req.stream = DEFAULT_STREAM;
	debugLog("客户端未指定stream参数，使用默认值: %v", DEFAULT_STREAM);
	}

	// 获取模型配置
	const modelConfig = getModelConfig(req.model);
	debugLog("请求解析成功 - 模型: %s (%s), 流式: %v, 消息数: %d", req.model, modelConfig.name, req.stream, req.messages.length);

	// Cherry Studio 调试：详细检查每条消息
	debugLog("🔍 Cherry Studio 调试 - 检查原始消息:");
	for (let i = 0; i < req.messages.length; i++) {
	const msg = req.messages[i];
	debugLog(" 消息[%d] role: %s", i, msg.role);

	if (typeof msg.content === 'string') {
	debugLog(" 消息[%d] content: 字符串类型, 长度: %d", i, msg.content.length);
	if (msg.content.length === 0) {
	debugLog(" ⚠️ 消息[%d] 内容为空字符串!", i);
	} else {
	debugLog(" 消息[%d] 内容预览: %s", i, msg.content.substring(0, 100));
	}
	} else if (Array.isArray(msg.content)) {
	debugLog(" 消息[%d] content: 数组类型, 块数: %d", i, msg.content.length);
	for (let j = 0; j < msg.content.length; j++) {
	const block = msg.content[j];
	debugLog(" 块[%d] type: %s", j, block.type);
	if (block.type === 'text' && block.text) {
	debugLog(" 块[%d] text: %s", j, block.text.substring(0, 50));
	} else if (block.type === 'image_url' && block.image_url?.url) {
	debugLog(" 块[%d] image_url: %s格式, 长度: %d", j,
	block.image_url.url.startsWith('data:') ? 'base64' : 'url',
	block.image_url.url.length);
	}
	}
	} else {
	debugLog(" ⚠️ 消息[%d] content 类型异常: %s", i, typeof msg.content);
	}
	}

	// 处理和验证消息（特别是多模态内容）
	const processedMessages = processMessages(req.messages, modelConfig);
	debugLog("消息处理完成，处理后消息数: %d", processedMessages.length);

	// 检查是否包含多模态内容
	const hasMultimodal = processedMessages.some(msg =>
	Array.isArray(msg.content) &&
	msg.content.some(block =>
	['image_url', 'video_url', 'document_url', 'audio_url'].includes(block.type)
	)
	);

	if (hasMultimodal) {
	debugLog("🎯 检测到全方位多模态请求，模型: %s", modelConfig.name);
	if (!modelConfig.capabilities.vision) {
	debugLog("❌ 严重错误: 模型不支持多模态，但收到了多媒体内容！");
	debugLog("💡 Cherry Studio用户请检查: 确认选择了 'glm-4.5v' 而不是 'GLM-4.5'");
	debugLog("🔧 模型映射状态: %s → %s (vision: %s)",
	req.model, modelConfig.upstreamId, modelConfig.capabilities.vision);
	} else {
	debugLog("✅ GLM-4.5V支持全方位多模态理解：图像、视频、文档、音频");

	// 检查是否使用匿名token（多模态功能的重要限制）
	if (!ZAI_TOKEN \|\| ZAI_TOKEN.trim() === "") {
	debugLog("⚠️ 重要警告: 正在使用匿名token处理多模态请求");
	debugLog("💡 Z.ai的匿名token可能不支持图像/视频/文档处理");
	debugLog("🔧 解决方案: 设置 ZAI_TOKEN 环境变量为正式的API Token");
	debugLog("📋 如果请求失败，这很可能是token权限问题");
	} else {
	debugLog("✅ 使用正式API Token，支持完整多模态功能");
	}
	}
	} else if (modelConfig.capabilities.vision && modelConfig.id === 'glm-4.5v') {
	debugLog("ℹ️ 使用GLM-4.5V模型但未检测到多媒体数据，仅处理文本内容");
	}

	// 生成会话相关ID
	const chatID = `${Date.now()}-${Math.floor(Date.now() / 1000)}`;
	const msgID = Date.now().toString();

	// 构造上游请求
	const upstreamReq: UpstreamRequest = {
	stream: true, // 总是使用流式从上游获取
	chat_id: chatID,
	id: msgID,
	model: modelConfig.upstreamId,
	messages: processedMessages,
	params: modelConfig.defaultParams,
	features: {
	enable_thinking: modelConfig.capabilities.thinking,
	image_generation: false,
	web_search: false,
	auto_web_search: false,
	preview_mode: modelConfig.capabilities.vision
	},
	background_tasks: {
	title_generation: false,
	tags_generation: false
	},
	mcp_servers: modelConfig.capabilities.mcp ? [] : undefined,
	model_item: {
	id: modelConfig.upstreamId,
	name: modelConfig.name,
	owned_by: "openai",
	openai: {
	id: modelConfig.upstreamId,
	name: modelConfig.upstreamId,
	owned_by: "openai",
	openai: {
	id: modelConfig.upstreamId
	},
	urlIdx: 1
	},
	urlIdx: 1,
	info: {
	id: modelConfig.upstreamId,
	user_id: "api-user",
	base_model_id: null,
	name: modelConfig.name,
	params: modelConfig.defaultParams,
	meta: {
	profile_image_url: "/static/favicon.png",
	description: modelConfig.capabilities.vision ? "Advanced visual understanding and analysis" : "Most advanced model, proficient in coding and tool use",
	capabilities: {
	vision: modelConfig.capabilities.vision,
	citations: false,
	preview_mode: modelConfig.capabilities.vision,
	web_search: false,
	language_detection: false,
	restore_n_source: false,
	mcp: modelConfig.capabilities.mcp,
	file_qa: modelConfig.capabilities.mcp,
	returnFc: true,
	returnThink: modelConfig.capabilities.thinking,
	think: modelConfig.capabilities.thinking
	}
	}
	}
	},
	tool_servers: [],
	variables: {
	"{{USER_NAME}}": `Guest-${Date.now()}`,
	"{{USER_LOCATION}}": "Unknown",
	"{{CURRENT_DATETIME}}": new Date().toLocaleString('zh-CN'),
	"{{CURRENT_DATE}}": new Date().toLocaleDateString('zh-CN'),
	"{{CURRENT_TIME}}": new Date().toLocaleTimeString('zh-CN'),
	"{{CURRENT_WEEKDAY}}": new Date().toLocaleDateString('zh-CN', { weekday: 'long' }),
	"{{CURRENT_TIMEZONE}}": "Asia/Shanghai",
	"{{USER_LANGUAGE}}": "zh-CN"
	}
	};

	// 选择本次对话使用的token
	let authToken = ZAI_TOKEN;
	if (ANON_TOKEN_ENABLED) {
	try {
	const anonToken = await getAnonymousToken();
	authToken = anonToken;
	debugLog("匿名token获取成功: %s...", anonToken.substring(0, 10));
	} catch (error) {
	debugLog("匿名token获取失败，回退固定token: %v", error);
	}
	}

	// 调用上游API
	try {
	if (req.stream) {
	return await handleStreamResponse(upstreamReq, chatID, authToken, startTime, path, userAgent, req, modelConfig);
	} else {
	return await handleNonStreamResponse(upstreamReq, chatID, authToken, startTime, path, userAgent, req, modelConfig);
	}
	} catch (error) {
	debugLog("调用上游失败: %v", error);
	const duration = Date.now() - startTime;
	recordRequestStats(startTime, path, 502);
	addLiveRequest(request.method, path, 502, duration, userAgent);
	return new Response("Failed to call upstream", {
	status: 502,
	headers
	});
	}
	}

	async function handleStreamResponse(
	upstreamReq: UpstreamRequest,
	chatID: string,
	authToken: string,
	startTime: number,
	path: string,
	userAgent: string,
	req: OpenAIRequest,
	modelConfig: ModelConfig
	): Promise<Response> {
	debugLog("开始处理流式响应 (chat_id=%s)", chatID);

	try {
	const response = await callUpstreamWithHeaders(upstreamReq, chatID, authToken);

	if (!response.ok) {
	debugLog("上游返回错误状态: %d", response.status);
	const duration = Date.now() - startTime;
	recordRequestStats(startTime, path, 502);
	addLiveRequest("POST", path, 502, duration, userAgent);
	return new Response("Upstream error", { status: 502 });
	}

	if (!response.body) {
	debugLog("上游响应体为空");
	const duration = Date.now() - startTime;
	recordRequestStats(startTime, path, 502);
	addLiveRequest("POST", path, 502, duration, userAgent);
	return new Response("Upstream response body is empty", { status: 502 });
	}

	// 创建可读流
	const { readable, writable } = new TransformStream();
	const writer = writable.getWriter();
	const encoder = new TextEncoder();

	// 发送第一个chunk（role）
	const firstChunk: OpenAIResponse = {
	id: `chatcmpl-${Date.now()}`,
	object: "chat.completion.chunk",
	created: Math.floor(Date.now() / 1000),
	model: req.model,
	choices: [
	{
	index: 0,
	delta: { role: "assistant" }
	}
	]
	};

	// 写入第一个chunk
	writer.write(encoder.encode(`data: ${JSON.stringify(firstChunk)}\n\n`));

	// 处理上游SSE流
	processUpstreamStream(response.body, writer, encoder, req.model).catch(error => {
	debugLog("处理上游流时出错: %v", error);
	});

	// 记录成功请求统计
	const duration = Date.now() - startTime;
	recordRequestStats(startTime, path, 200);
	addLiveRequest("POST", path, 200, duration, userAgent, modelConfig.name);

	return new Response(readable, {
	status: 200,
	headers: {
	"Content-Type": "text/event-stream",
	"Cache-Control": "no-cache",
	"Connection": "keep-alive",
	"Access-Control-Allow-Origin": "*",
	"Access-Control-Allow-Methods": "GET, POST, PUT, DELETE, OPTIONS",
	"Access-Control-Allow-Headers": "Content-Type, Authorization",
	"Access-Control-Allow-Credentials": "true"
	}
	});
	} catch (error) {
	debugLog("处理流式响应时出错: %v", error);
	const duration = Date.now() - startTime;
	recordRequestStats(startTime, path, 502);
	addLiveRequest("POST", path, 502, duration, userAgent);
	return new Response("Failed to process stream response", { status: 502 });
	}
	}

	async function handleNonStreamResponse(
	upstreamReq: UpstreamRequest,
	chatID: string,
	authToken: string,
	startTime: number,
	path: string,
	userAgent: string,
	req: OpenAIRequest,
	modelConfig: ModelConfig
	): Promise<Response> {
	debugLog("开始处理非流式响应 (chat_id=%s)", chatID);

	try {
	const response = await callUpstreamWithHeaders(upstreamReq, chatID, authToken);

	if (!response.ok) {
	debugLog("上游返回错误状态: %d", response.status);
	const duration = Date.now() - startTime;
	recordRequestStats(startTime, path, 502);
	addLiveRequest("POST", path, 502, duration, userAgent);
	return new Response("Upstream error", { status: 502 });
	}

	if (!response.body) {
	debugLog("上游响应体为空");
	const duration = Date.now() - startTime;
	recordRequestStats(startTime, path, 502);
	addLiveRequest("POST", path, 502, duration, userAgent);
	return new Response("Upstream response body is empty", { status: 502 });
	}

	// 收集完整响应
	const finalContent = await collectFullResponse(response.body);
	debugLog("内容收集完成，最终长度: %d", finalContent.length);

	// 构造完整响应
	const openAIResponse: OpenAIResponse = {
	id: `chatcmpl-${Date.now()}`,
	object: "chat.completion",
	created: Math.floor(Date.now() / 1000),
	model: req.model,
	choices: [
	{
	index: 0,
	message: {
	role: "assistant",
	content: finalContent
	},
	finish_reason: "stop"
	}
	],
	usage: {
	prompt_tokens: 0,
	completion_tokens: 0,
	total_tokens: 0
	}
	};

	// 记录成功请求统计
	const duration = Date.now() - startTime;
	recordRequestStats(startTime, path, 200);
	addLiveRequest("POST", path, 200, duration, userAgent, modelConfig.name);

	return new Response(JSON.stringify(openAIResponse), {
	status: 200,
	headers: {
	"Content-Type": "application/json",
	"Access-Control-Allow-Origin": "*",
	"Access-Control-Allow-Methods": "GET, POST, PUT, DELETE, OPTIONS",
	"Access-Control-Allow-Headers": "Content-Type, Authorization",
	"Access-Control-Allow-Credentials": "true"
	}
	});
	} catch (error) {
	debugLog("处理非流式响应时出错: %v", error);
	const duration = Date.now() - startTime;
	recordRequestStats(startTime, path, 502);
	addLiveRequest("POST", path, 502, duration, userAgent);
	return new Response("Failed to process non-stream response", { status: 502 });
	}
	}

	/**
	* 生成 Dashboard 监控页面HTML模板
	* 提供实时API调用监控和统计信息展示
	* @returns string 完整的HTML页面内容
	*/
	function getDashboardHTML(): string {
	return `<!DOCTYPE html>
	<html lang="zh-CN">
	<head>
	<meta charset="UTF-8">
	<meta name="viewport" content="width=device-width, initial-scale=1.0">
	<title>API调用看板</title>
	<style>
	body {
	font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif;
	margin: 0;
	padding: 20px;
	background-color: #f5f5f5;
	}
	.container {
	max-width: 1200px;
	margin: 0 auto;
	background-color: white;
	border-radius: 8px;
	box-shadow: 0 2px 10px rgba(0,0,0,0.1);
	padding: 20px;
	}
	h1 {
	color: #333;
	text-align: center;
	margin-bottom: 30px;
	}
	.stats-container {
	display: grid;
	grid-template-columns: repeat(auto-fit, minmax(200px, 1fr));
	gap: 20px;
	margin-bottom: 30px;
	}
	.stat-card {
	background-color: #f8f9fa;
	border-radius: 6px;
	padding: 15px;
	text-align: center;
	box-shadow: 0 1px 3px rgba(0,0,0,0.1);
	}
	.stat-value {
	font-size: 24px;
	font-weight: bold;
	color: #007bff;
	}
	.stat-label {
	font-size: 14px;
	color: #6c757d;
	margin-top: 5px;
	}
	.requests-container {
	margin-top: 30px;
	}
	.requests-table {
	width: 100%;
	border-collapse: collapse;
	}
	.requests-table th, .requests-table td {
	padding: 10px;
	text-align: left;
	border-bottom: 1px solid #ddd;
	}
	.requests-table th {
	background-color: #f8f9fa;
	}
	.status-success {
	color: #28a745;
	}
	.status-error {
	color: #dc3545;
	}
	.refresh-info {
	text-align: center;
	margin-top: 20px;
	color: #6c757d;
	font-size: 14px;
	}
	.pagination-container {
	display: flex;
	justify-content: center;
	align-items: center;
	margin-top: 20px;
	gap: 10px;
	}
	.pagination-container button {
	padding: 5px 10px;
	background-color: #007bff;
	color: white;
	border: none;
	border-radius: 4px;
	cursor: pointer;
	}
	.pagination-container button:disabled {
	background-color: #cccccc;
	cursor: not-allowed;
	}
	.pagination-container button:hover:not(:disabled) {
	background-color: #0056b3;
	}
	.chart-container {
	margin-top: 30px;
	height: 300px;
	background-color: #f8f9fa;
	border-radius: 6px;
	padding: 15px;
	box-shadow: 0 1px 3px rgba(0,0,0,0.1);
	}
	</style>
	</head>
	<body>
	<div class="container">
	<h1>API调用看板</h1>

	<div class="stats-container">
	<div class="stat-card">
	<div class="stat-value" id="total-requests">0</div>
	<div class="stat-label">总请求数</div>
	</div>
	<div class="stat-card">
	<div class="stat-value" id="successful-requests">0</div>
	<div class="stat-label">成功请求</div>
	</div>
	<div class="stat-card">
	<div class="stat-value" id="failed-requests">0</div>
	<div class="stat-label">失败请求</div>
	</div>
	<div class="stat-card">
	<div class="stat-value" id="avg-response-time">0s</div>
	<div class="stat-label">平均响应时间</div>
	</div>
	</div>

	<div class="chart-container">
	<h2>请求统计图表</h2>
	<canvas id="requestsChart"></canvas>
	</div>

	<div class="requests-container">
	<h2>实时请求</h2>
	<table class="requests-table">
	<thead>
	<tr>
	<th>时间</th>
	<th>模型</th>
	<th>方法</th>
	<th>状态</th>
	<th>耗时</th>
	<th>User Agent</th>
	</tr>
	</thead>
	<tbody id="requests-tbody">
	<!-- 请求记录将通过JavaScript动态添加 -->
	</tbody>
	</table>
	<div class="pagination-container">
	<button id="prev-page" disabled>上一页</button>
	<span id="page-info">第 1 页，共 1 页</span>
	<button id="next-page" disabled>下一页</button>
	</div>
	</div>

	<div class="refresh-info">
	数据每5秒自动刷新一次
	</div>
	</div>

	<script src="https://cdn.jsdelivr.net/npm/chart.js"></script>
	<script>
	// 全局变量
	let allRequests = [];
	let currentPage = 1;
	const itemsPerPage = 10;
	let requestsChart = null;

	// 更新统计数据
	function updateStats() {
	fetch('/dashboard/stats')
	.then(response => response.json())
	.then(data => {
	document.getElementById('total-requests').textContent = data.totalRequests \|\| 0;
	document.getElementById('successful-requests').textContent = data.successfulRequests \|\| 0;
	document.getElementById('failed-requests').textContent = data.failedRequests \|\| 0;
	document.getElementById('avg-response-time').textContent = ((data.averageResponseTime \|\| 0) / 1000).toFixed(2) + 's';
	})
	.catch(error => console.error('Error fetching stats:', error));
	}

	// 更新请求列表
	function updateRequests() {
	fetch('/dashboard/requests')
	.then(response => response.json())
	.then(data => {
	// 检查数据是否为数组
	if (!Array.isArray(data)) {
	console.error('返回的数据不是数组:', data);
	return;
	}

	// 保存所有请求数据
	allRequests = data;

	// 按时间倒序排列
	allRequests.sort((a, b) => {
	const timeA = new Date(a.timestamp);
	const timeB = new Date(b.timestamp);
	return timeB - timeA;
	});

	// 更新表格
	updateTable();

	// 更新图表
	updateChart();

	// 更新分页信息
	updatePagination();
	})
	.catch(error => console.error('Error fetching requests:', error));
	}

	// 更新表格显示
	function updateTable() {
	const tbody = document.getElementById('requests-tbody');
	tbody.innerHTML = '';

	// 计算当前页的数据范围
	const startIndex = (currentPage - 1) * itemsPerPage;
	const endIndex = startIndex + itemsPerPage;
	const currentRequests = allRequests.slice(startIndex, endIndex);

	currentRequests.forEach(request => {
	const row = document.createElement('tr');

	// 格式化时间 - 检查时间戳是否有效
	let timeStr = "Invalid Date";
	if (request.timestamp) {
	try {
	const time = new Date(request.timestamp);
	if (!isNaN(time.getTime())) {
	timeStr = time.toLocaleTimeString();
	}
	} catch (e) {
	console.error("时间格式化错误:", e);
	}
	}

	// 判断模型名称
	let modelName = "GLM-4.5";
	if (request.path && request.path.includes('glm-4.5v')) {
	modelName = "GLM-4.5V";
	} else if (request.model) {
	modelName = request.model;
	}

	// 状态样式
	const statusClass = request.status >= 200 && request.status < 300 ? 'status-success' : 'status-error';
	const status = request.status \|\| "undefined";

	// 截断 User Agent，避免过长
	let userAgent = request.user_agent \|\| "undefined";
	if (userAgent.length > 30) {
	userAgent = userAgent.substring(0, 30) + "...";
	}

	row.innerHTML = "<td>" + timeStr + "</td>" + "<td>" + modelName + "</td>" + "<td>" + (request.method \|\| "undefined") + "</td>" + "<td class='" + statusClass + "'>" + status + "</td>" + "<td>" + ((request.duration / 1000).toFixed(2) \|\| "undefined") + "s</td>" + "<td title='" + (request.user_agent \|\| "") + "'>" + userAgent + "</td>";

	tbody.appendChild(row);
	});
	}

	// 更新分页信息
	function updatePagination() {
	const totalPages = Math.ceil(allRequests.length / itemsPerPage);
	document.getElementById('page-info').textContent = "第 " + currentPage + " 页，共 " + totalPages + " 页";

	document.getElementById('prev-page').disabled = currentPage <= 1;
	document.getElementById('next-page').disabled = currentPage >= totalPages;
	}

	// 更新图表
	function updateChart() {
	const ctx = document.getElementById('requestsChart').getContext('2d');

	// 准备图表数据 - 最近20条请求的响应时间
	const chartData = allRequests.slice(0, 20).reverse();
	const labels = chartData.map(req => {
	const time = new Date(req.timestamp);
	return time.toLocaleTimeString();
	});
	const responseTimes = chartData.map(req => req.duration);

	// 如果图表已存在，先销毁
	if (requestsChart) {
	requestsChart.destroy();
	}

	// 创建新图表
	requestsChart = new Chart(ctx, {
	type: 'line',
	data: {
	labels: labels,
	datasets: [{
	label: '响应时间 (s)',
	data: responseTimes.map(time => time / 1000),
	borderColor: '#007bff',
	backgroundColor: 'rgba(0, 123, 255, 0.1)',
	tension: 0.1,
	fill: true
	}]
	},
	options: {
	responsive: true,
	maintainAspectRatio: false,
	scales: {
	y: {
	beginAtZero: true,
	title: {
	display: true,
	text: '响应时间 (s)'
	}
	},
	x: {
	title: {
	display: true,
	text: '时间'
	}
	}
	},
	plugins: {
	title: {
	display: true,
	text: '最近20条请求的响应时间趋势 (s)'
	}
	}
	}
	});
	}

	// 分页按钮事件
	document.getElementById('prev-page').addEventListener('click', function() {
	if (currentPage > 1) {
	currentPage--;
	updateTable();
	updatePagination();
	}
	});

	document.getElementById('next-page').addEventListener('click', function() {
	const totalPages = Math.ceil(allRequests.length / itemsPerPage);
	if (currentPage < totalPages) {
	currentPage++;
	updateTable();
	updatePagination();
	}
	});

	// 初始加载
	updateStats();
	updateRequests();

	// 定时刷新
	setInterval(updateStats, 5000);
	setInterval(updateRequests, 5000);
	</script>
	</body>
	</html>`;
	}

	/**
	* 处理 Dashboard 监控页面请求
	* 返回实时监控面板的HTML页面
	* @param request HTTP请求对象
	* @returns Promise<Response> HTML响应
	*/
	async function handleDashboard(request: Request): Promise<Response> {
	if (request.method !== "GET") {
	return new Response("Method not allowed", { status: 405 });
	}

	return new Response(getDashboardHTML(), {
	status: 200,
	headers: {
	"Content-Type": "text/html; charset=utf-8"
	}
	});
	}

	// 处理Dashboard统计数据
	async function handleDashboardStats(request: Request): Promise<Response> {
	return new Response(getStatsData(), {
	status: 200,
	headers: {
	"Content-Type": "application/json"
	}
	});
	}

	async function handleDashboardRequests(request: Request): Promise<Response> {
	return new Response(getLiveRequestsData(), {
	status: 200,
	headers: {
	"Content-Type": "application/json"
	}
	});
	}


	function getDocsHTML(): string {
	return `<!DOCTYPE html>
	<html lang="zh-CN">
	<head>
	<meta charset="UTF-8">
	<meta name="viewport" content="width=device-width, initial-scale=1.0">
	<title>ZtoApi 文档</title>
	<style>
	body {
	font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif;
	margin: 0;
	padding: 20px;
	background-color: #f5f5f5;
	line-height: 1.6;
	}
	.container {
	max-width: 1200px;
	margin: 0 auto;
	background-color: white;
	border-radius: 8px;
	box-shadow: 0 2px 10px rgba(0,0,0,0.1);
	padding: 30px;
	}
	h1 {
	color: #333;
	text-align: center;
	margin-bottom: 30px;
	border-bottom: 2px solid #007bff;
	padding-bottom: 10px;
	}
	h2 {
	color: #007bff;
	margin-top: 30px;
	margin-bottom: 15px;
	}
	h3 {
	color: #333;
	margin-top: 25px;
	margin-bottom: 10px;
	}
	.endpoint {
	background-color: #f8f9fa;
	border-radius: 6px;
	padding: 15px;
	margin-bottom: 20px;
	border-left: 4px solid #007bff;
	}
	.method {
	display: inline-block;
	padding: 4px 8px;
	border-radius: 4px;
	color: white;
	font-weight: bold;
	margin-right: 10px;
	font-size: 14px;
	}
	.get { background-color: #28a745; }
	.post { background-color: #007bff; }
	.path {
	font-family: monospace;
	background-color: #e9ecef;
	padding: 2px 6px;
	border-radius: 3px;
	font-size: 16px;
	}
	.description {
	margin: 15px 0;
	}
	.parameters {
	margin: 15px 0;
	}
	table {
	width: 100%;
	border-collapse: collapse;
	margin: 15px 0;
	}
	th, td {
	padding: 10px;
	text-align: left;
	border-bottom: 1px solid #ddd;
	}
	th {
	background-color: #f8f9fa;
	font-weight: bold;
	}
	.example {
	background-color: #f8f9fa;
	border-radius: 6px;
	padding: 15px;
	margin: 15px 0;
	font-family: monospace;
	white-space: pre-wrap;
	overflow-x: auto;
	}
	.note {
	background-color: #fff3cd;
	border-left: 4px solid #ffc107;
	padding: 10px 15px;
	margin: 15px 0;
	border-radius: 0 4px 4px 0;
	}
	.response {
	background-color: #f8f9fa;
	border-radius: 6px;
	padding: 15px;
	margin: 15px 0;
	font-family: monospace;
	white-space: pre-wrap;
	overflow-x: auto;
	}
	.tab {
	overflow: hidden;
	border: 1px solid #ccc;
	background-color: #f1f1f1;
	border-radius: 4px 4px 0 0;
	}
	.tab button {
	background-color: inherit;
	float: left;
	border: none;
	outline: none;
	cursor: pointer;
	padding: 14px 16px;
	transition: 0.3s;
	font-size: 16px;
	}
	.tab button:hover {
	background-color: #ddd;
	}
	.tab button.active {
	background-color: #ccc;
	}
	.tabcontent {
	display: none;
	padding: 6px 12px;
	border: 1px solid #ccc;
	border-top: none;
	border-radius: 0 0 4px 4px;
	}
	.toc {
	background-color: #f8f9fa;
	border-radius: 6px;
	padding: 15px;
	margin-bottom: 20px;
	}
	.toc ul {
	padding-left: 20px;
	}
	.toc li {
	margin: 5px 0;
	}
	.toc a {
	color: #007bff;
	text-decoration: none;
	}
	.toc a:hover {
	text-decoration: underline;
	}
	</style>
	</head>
	<body>
	<div class="container">
	<h1>ZtoApi 文档</h1>

	<div class="toc">
	<h2>目录</h2>
	<ul>
	<li><a href="#overview">概述</a></li>
	<li><a href="#authentication">身份验证</a></li>
	<li><a href="#endpoints">API端点</a>
	<ul>
	<li><a href="#models">获取模型列表</a></li>
	<li><a href="#chat-completions">聊天完成</a></li>
	</ul>
	</li>
	<li><a href="#examples">使用示例</a></li>
	<li><a href="#error-handling">错误处理</a></li>
	</ul>
	</div>

	<section id="overview">
	<h2>概述</h2>
	<p>这是一个为Z.ai GLM-4.5模型提供OpenAI兼容API接口的代理服务器。它允许你使用标准的OpenAI API格式与Z.ai的GLM-4.5模型进行交互，支持流式和非流式响应。</p>
	<p><strong>基础URL:</strong> <code>http://localhost:9090/v1</code></p>
	<div class="note">
	<strong>注意:</strong> 默认端口为9090，可以通过环境变量PORT进行修改。
	</div>
	</section>

	<section id="authentication">
	<h2>身份验证</h2>
	<p>所有API请求都需要在请求头中包含有效的API密钥进行身份验证：</p>
	<div class="example">
	Authorization: Bearer your-api-key</div>
	<p>默认的API密钥为 <code>sk-your-key</code>，可以通过环境变量 <code>DEFAULT_KEY</code> 进行修改。</p>
	</section>

	<section id="endpoints">
	<h2>API端点</h2>

	<div class="endpoint" id="models">
	<h3>获取模型列表</h3>
	<div>
	<span class="method get">GET</span>
	<span class="path">/v1/models</span>
	</div>
	<div class="description">
	<p>获取可用模型列表。</p>
	</div>
	<div class="parameters">
	<h4>请求参数</h4>
	<p>无</p>
	</div>
	<div class="response">
	{
	"object": "list",
	"data": [
	{
	"id": "GLM-4.5",
	"object": "model",
	"created": 1756788845,
	"owned_by": "z.ai"
	}
	]
	}</div>
	</div>

	<div class="endpoint" id="chat-completions">
	<h3>聊天完成</h3>
	<div>
	<span class="method post">POST</span>
	<span class="path">/v1/chat/completions</span>
	</div>
	<div class="description">
	<p>基于消息列表生成模型响应。支持流式和非流式两种模式。</p>
	</div>
	<div class="parameters">
	<h4>请求参数</h4>
	<table>
	<thead>
	<tr>
	<th>参数名</th>
	<th>类型</th>
	<th>必需</th>
	<th>说明</th>
	</tr>
	</thead>
	<tbody>
	<tr>
	<td>model</td>
	<td>string</td>
	<td>是</td>
	<td>要使用的模型ID，例如 "GLM-4.5"</td>
	</tr>
	<tr>
	<td>messages</td>
	<td>array</td>
	<td>是</td>
	<td>消息列表，包含角色和内容</td>
	</tr>
	<tr>
	<td>stream</td>
	<td>boolean</td>
	<td>否</td>
	<td>是否使用流式响应，默认为true</td>
	</tr>
	<tr>
	<td>temperature</td>
	<td>number</td>
	<td>否</td>
	<td>采样温度，控制随机性</td>
	</tr>
	<tr>
	<td>max_tokens</td>
	<td>integer</td>
	<td>否</td>
	<td>生成的最大令牌数</td>
	</tr>
	</tbody>
	</table>
	</div>
	<div class="parameters">
	<h4>消息格式</h4>
	<table>
	<thead>
	<tr>
	<th>字段</th>
	<th>类型</th>
	<th>说明</th>
	</tr>
	</thead>
	<tbody>
	<tr>
	<td>role</td>
	<td>string</td>
	<td>消息角色，可选值：system、user、assistant</td>
	</tr>
	<tr>
	<td>content</td>
	<td>string</td>
	<td>消息内容</td>
	</tr>
	</tbody>
	</table>
	</div>
	</div>
	</section>

	<section id="examples">
	<h2>使用示例</h2>

	<div class="tab">
	<button class="tablinks active" onclick="openTab(event, 'python-tab')">Python</button>
	<button class="tablinks" onclick="openTab(event, 'curl-tab')">cURL</button>
	<button class="tablinks" onclick="openTab(event, 'javascript-tab')">JavaScript</button>
	</div>

	<div id="python-tab" class="tabcontent" style="display: block;">
	<h3>Python示例</h3>
	<div class="example">
	import openai

	# 配置客户端
	client = openai.OpenAI(
	api_key="your-api-key", # 对应 DEFAULT_KEY
	base_url="http://localhost:9090/v1"
	)

	# 非流式请求 - 使用GLM-4.5
	response = client.chat.completions.create(
	model="GLM-4.5",
	messages=[{"role": "user", "content": "你好，请介绍一下自己"}]
	)

	print(response.choices[0].message.content)


	# 流式请求 - 使用GLM-4.5
	response = client.chat.completions.create(
	model="GLM-4.5",
	messages=[{"role": "user", "content": "请写一首关于春天的诗"}],
	stream=True
	)


	for chunk in response:
	if chunk.choices[0].delta.content:
	print(chunk.choices[0].delta.content, end="")</div>
	</div>

	<div id="curl-tab" class="tabcontent">
	<h3>cURL示例</h3>
	<div class="example">
	# 非流式请求
	curl -X POST http://localhost:9090/v1/chat/completions \
	-H "Content-Type: application/json" \
	-H "Authorization: Bearer your-api-key" \
	-d '{
	"model": "GLM-4.5",
	"messages": [{"role": "user", "content": "你好"}],
	"stream": false
	}'

	# 流式请求
	curl -X POST http://localhost:9090/v1/chat/completions \
	-H "Content-Type: application/json" \
	-H "Authorization: Bearer your-api-key" \
	-d '{
	"model": "GLM-4.5",
	"messages": [{"role": "user", "content": "你好"}],
	"stream": true
	}'</div>
	</div>

	<div id="javascript-tab" class="tabcontent">
	<h3>JavaScript示例</h3>
	<div class="example">
	const fetch = require('node-fetch');

	async function chatWithGLM(message, stream = false) {
	const response = await fetch('http://localhost:9090/v1/chat/completions', {
	method: 'POST',
	headers: {
	'Content-Type': 'application/json',
	'Authorization': 'Bearer your-api-key'
	},
	body: JSON.stringify({
	model: 'GLM-4.5',
	messages: [{ role: 'user', content: message }],
	stream: stream
	})
	});

	if (stream) {
	// 处理流式响应
	const reader = response.body.getReader();
	const decoder = new TextDecoder();

	while (true) {
	const { done, value } = await reader.read();
	if (done) break;

	const chunk = decoder.decode(value);
	const lines = chunk.split('\n');

	for (const line of lines) {
	if (line.startsWith('data: ')) {
	const data = line.slice(6);
	if (data === '[DONE]') {
	console.log('\n流式响应完成');
	return;
	}

	try {
	const parsed = JSON.parse(data);
	const content = parsed.choices[0]?.delta?.content;
	if (content) {
	process.stdout.write(content);
	}
	} catch (e) {
	// 忽略解析错误
	}
	}
	}
	}
	} else {
	// 处理非流式响应
	const data = await response.json();
	console.log(data.choices[0].message.content);
	}
	}

	// 使用示例
	chatWithGLM('你好，请介绍一下JavaScript', false);</div>
	</div>
	</section>

	<section id="error-handling">
	<h2>错误处理</h2>
	<p>API使用标准HTTP状态码来表示请求的成功或失败：</p>
	<table>
	<thead>
	<tr>
	<th>状态码</th>
	<th>说明</th>
	</tr>
	</thead>
	<tbody>
	<tr>
	<td>200 OK</td>
	<td>请求成功</td>
	</tr>
	<tr>
	<td>400 Bad Request</td>
	<td>请求格式错误或参数无效</td>
	</tr>
	<tr>
	<td>401 Unauthorized</td>
	<td>API密钥无效或缺失</td>
	</tr>
	<tr>
	<td>502 Bad Gateway</td>
	<td>上游服务错误</td>
	</tr>
	</tbody>
	</table>
	<div class="note">
	<strong>注意:</strong> 在调试模式下，服务器会输出详细的日志信息，可以通过设置环境变量 DEBUG_MODE=true 来启用。
	</div>
	</section>
	</div>

	<script>
	function openTab(evt, tabName) {
	var i, tabcontent, tablinks;
	tabcontent = document.getElementsByClassName("tabcontent");
	for (i = 0; i < tabcontent.length; i++) {
	tabcontent[i].style.display = "none";
	}
	tablinks = document.getElementsByClassName("tablinks");
	for (i = 0; i < tablinks.length; i++) {
	tablinks[i].className = tablinks[i].className.replace(" active", "");
	}
	document.getElementById(tabName).style.display = "block";
	evt.currentTarget.className += " active";
	}
	</script>
	</body>
	</html>`;
	}

	// 处理API文档页面
	async function handleDocs(request: Request): Promise<Response> {
	if (request.method !== "GET") {
	return new Response("Method not allowed", { status: 405 });
	}

	return new Response(getDocsHTML(), {
	status: 200,
	headers: {
	"Content-Type": "text/html; charset=utf-8"
	}
	});
	}

	// 主HTTP服务器
	async function main() {
	console.log(`OpenAI兼容API服务器启动`);
	console.log(`支持的模型: ${SUPPORTED_MODELS.map(m => `${m.id} (${m.name})`).join(', ')}`);
	console.log(`上游: ${UPSTREAM_URL}`);
	console.log(`Debug模式: ${DEBUG_MODE}`);
	console.log(`默认流式响应: ${DEFAULT_STREAM}`);
	console.log(`Dashboard启用: ${DASHBOARD_ENABLED}`);

	// 检测是否在Deno Deploy上运行
	const isDenoDeploy = Deno.env.get("DENO_DEPLOYMENT_ID") !== undefined;

	if (isDenoDeploy) {
	// Deno Deploy环境
	console.log("运行在Deno Deploy环境中");
	Deno.serve(handleRequest,{ port: 7860 });
	} else {
	// 本地或自托管环境
	const port = parseInt(Deno.env.get("PORT") \|\| "7860");
	console.log(`运行在本地环境中，端口: ${port}`);

	if (DASHBOARD_ENABLED) {
	console.log(`Dashboard已启用，访问地址: http://localhost:${port}/dashboard`);
	}

	const server = Deno.listen({ port });

	for await (const conn of server) {
	handleHttp(conn);
	}
	}
	}

	// 处理HTTP连接（用于本地环境）
	async function handleHttp(conn: Deno.Conn) {
	const httpConn = Deno.serveHttp(conn);

	while (true) {
	const requestEvent = await httpConn.nextRequest();
	if (!requestEvent) break;

	const { request, respondWith } = requestEvent;
	const url = new URL(request.url);
	const startTime = Date.now();
	const userAgent = request.headers.get("User-Agent") \|\| "";

	try {
	// 路由分发
	if (url.pathname === "/") {
	const response = await handleIndex(request);
	await respondWith(response);
	recordRequestStats(startTime, url.pathname, response.status);
	addLiveRequest(request.method, url.pathname, response.status, Date.now() - startTime, userAgent);
	} else if (url.pathname === "/v1/models") {
	const response = await handleModels(request);
	await respondWith(response);
	recordRequestStats(startTime, url.pathname, response.status);
	addLiveRequest(request.method, url.pathname, response.status, Date.now() - startTime, userAgent);
	} else if (url.pathname === "/v1/chat/completions") {
	const response = await handleChatCompletions(request);
	await respondWith(response);
	// 请求统计已在handleChatCompletions中记录
	} else if (url.pathname === "/docs") {
	const response = await handleDocs(request);
	await respondWith(response);
	recordRequestStats(startTime, url.pathname, response.status);
	addLiveRequest(request.method, url.pathname, response.status, Date.now() - startTime, userAgent);
	} else if (url.pathname === "/dashboard" && DASHBOARD_ENABLED) {
	const response = await handleDashboard(request);
	await respondWith(response);
	recordRequestStats(startTime, url.pathname, response.status);
	addLiveRequest(request.method, url.pathname, response.status, Date.now() - startTime, userAgent);
	} else if (url.pathname === "/dashboard/stats" && DASHBOARD_ENABLED) {
	const response = await handleDashboardStats(request);
	await respondWith(response);
	recordRequestStats(startTime, url.pathname, response.status);
	addLiveRequest(request.method, url.pathname, response.status, Date.now() - startTime, userAgent);
	} else if (url.pathname === "/dashboard/requests" && DASHBOARD_ENABLED) {
	const response = await handleDashboardRequests(request);
	await respondWith(response);
	recordRequestStats(startTime, url.pathname, response.status);
	addLiveRequest(request.method, url.pathname, response.status, Date.now() - startTime, userAgent);
	} else {
	const response = await handleOptions(request);
	await respondWith(response);
	recordRequestStats(startTime, url.pathname, response.status);
	addLiveRequest(request.method, url.pathname, response.status, Date.now() - startTime, userAgent);
	}
	} catch (error) {
	debugLog("处理请求时出错: %v", error);
	const response = new Response("Internal Server Error", { status: 500 });
	await respondWith(response);
	recordRequestStats(startTime, url.pathname, 500);
	addLiveRequest(request.method, url.pathname, 500, Date.now() - startTime, userAgent);
	}
	}
	}

	// 处理HTTP请求（用于Deno Deploy环境）
	async function handleRequest(request: Request): Promise<Response> {
	const url = new URL(request.url);
	const startTime = Date.now();
	const userAgent = request.headers.get("User-Agent") \|\| "";

	try {
	// 路由分发
	if (url.pathname === "/") {
	const response = await handleIndex(request);
	recordRequestStats(startTime, url.pathname, response.status);
	addLiveRequest(request.method, url.pathname, response.status, Date.now() - startTime, userAgent);
	return response;
	} else if (url.pathname === "/v1/models") {
	const response = await handleModels(request);
	recordRequestStats(startTime, url.pathname, response.status);
	addLiveRequest(request.method, url.pathname, response.status, Date.now() - startTime, userAgent);
	return response;
	} else if (url.pathname === "/v1/chat/completions") {
	const response = await handleChatCompletions(request);
	// 请求统计已在handleChatCompletions中记录
	return response;
	} else if (url.pathname === "/docs") {
	const response = await handleDocs(request);
	recordRequestStats(startTime, url.pathname, response.status);
	addLiveRequest(request.method, url.pathname, response.status, Date.now() - startTime, userAgent);
	return response;
	} else if (url.pathname === "/dashboard" && DASHBOARD_ENABLED) {
	const response = await handleDashboard(request);
	recordRequestStats(startTime, url.pathname, response.status);
	addLiveRequest(request.method, url.pathname, response.status, Date.now() - startTime, userAgent);
	return response;
	} else if (url.pathname === "/dashboard/stats" && DASHBOARD_ENABLED) {
	const response = await handleDashboardStats(request);
	recordRequestStats(startTime, url.pathname, response.status);
	addLiveRequest(request.method, url.pathname, response.status, Date.now() - startTime, userAgent);
	return response;
	} else if (url.pathname === "/dashboard/requests" && DASHBOARD_ENABLED) {
	const response = await handleDashboardRequests(request);
	recordRequestStats(startTime, url.pathname, response.status);
	addLiveRequest(request.method, url.pathname, response.status, Date.now() - startTime, userAgent);
	return response;
	} else {
	const response = await handleOptions(request);
	recordRequestStats(startTime, url.pathname, response.status);
	addLiveRequest(request.method, url.pathname, response.status, Date.now() - startTime, userAgent);
	return response;
	}
	} catch (error) {
	debugLog("处理请求时出错: %v", error);
	recordRequestStats(startTime, url.pathname, 500);
	addLiveRequest(request.method, url.pathname, 500, Date.now() - startTime, userAgent);
	return new Response("Internal Server Error", { status: 500 });
	}
	}

	// 启动服务器
	main();