update at 2025-10-14 21:52:11

This commit is contained in:
douboer
2025-10-14 21:52:11 +08:00
parent ac3ed480ab
commit 4f5eea604e
40 changed files with 15231 additions and 126 deletions

View File

@@ -0,0 +1,954 @@
/**
 * One configured model-provider endpoint as tracked by the service manager.
 */
export interface ModelService {
  /** Key under which the service is stored in the manager's registry. */
  id: string
  /** Display name; only used for logging in this file. */
  name: string
  /** Provider family; selects auth headers, endpoints and payload format. */
  type:
    | 'openai'
    | 'claude'
    | 'gemini'
    | 'azure'
    | 'local'
    | 'dashscope'
    | 'volcengine'
    | 'custom'
  /** Base URL to which endpoint paths such as `/models` are appended. */
  url: string
  /** Credential sent in a provider-specific header or query parameter. */
  apiKey: string
  /** Connection state; chat requests are refused unless it is 'connected'. */
  status:
    | 'connected'
    | 'disconnected'
    | 'connecting'
    | 'error'
  /** Model identifiers known for this service. */
  models?: string[]
  /** Set to the current time when a connection attempt succeeds. */
  lastUsed?: Date
  /** JSON text; its `headers` object is merged into requests for 'custom' services. */
  customConfig?: string
  /** Message of the most recent failed connection attempt. */
  errorMessage?: string
}
/**
 * Result envelope returned by the manager's public request methods instead
 * of throwing.
 */
export interface ApiResponse<T = any> {
  /** True when the operation completed. */
  success: boolean
  /** Payload supplied on success. */
  data?: T
  /** Human-readable failure reason supplied on failure. */
  error?: string
}
/**
 * Registry of configured model services plus the HTTP plumbing used to talk
 * to them: connection tests, model discovery and (streaming) chat requests.
 *
 * Obtain the shared instance through `ModelServiceManager.getInstance()`.
 * Public request methods report failures through `ApiResponse` rather than
 * throwing; `connectService` is the exception and rejects on failure.
 */
export class ModelServiceManager {
  /** Timeout for connection probes and model-list requests. */
  private static readonly CONNECT_TIMEOUT_MS = 10000
  /** Timeout for a non-streaming chat request (until response headers arrive). */
  private static readonly CHAT_TIMEOUT_MS = 30000
  /** Longest silence tolerated while opening or reading a streaming response. */
  private static readonly STREAM_IDLE_TIMEOUT_MS = 60000
  /** `max_tokens` sent with every Claude chat request. */
  private static readonly CLAUDE_MAX_TOKENS = 4096
  /** API version appended to every Azure OpenAI URL. */
  private static readonly AZURE_API_VERSION = '2023-12-01-preview'
  /** Model used for the one-token Claude authentication probe. */
  private static readonly CLAUDE_PROBE_MODEL = 'claude-3-haiku-20240307'

  /** Saved provider type -> service type. Unlisted types fall back to 'custom'. */
  private static readonly PROVIDER_TYPES: ReadonlyMap<string, ModelService['type']> =
    new Map<string, ModelService['type']>([
      ['openai', 'openai'],
      ['claude', 'claude'],
      ['anthropic', 'claude'],
      ['google', 'gemini'],
      ['gemini', 'gemini'],
      ['ollama', 'local'],
      ['volcengine', 'volcengine'], // Volcengine
      ['dashscope', 'dashscope'], // Alibaba Cloud DashScope
      ['azure', 'azure'],
      ['local', 'local'],
      ['custom', 'custom']
    ])

  /**
   * Recommended Volcengine models (the service is treated as having no
   * model-list endpoint). Reference: https://www.volcengine.com/docs/82379/1330310
   */
  private static readonly VOLCENGINE_MODELS: readonly string[] = [
    // DeepSeek V3 series
    'deepseek-v3-1-terminus',
    'deepseek-v3-1-250821',
    // Doubao Seed 1.6 series
    'doubao-seed-1-6-vision-250815',
    'doubao-seed-1-6-250615',
    'doubao-seed-1-6-flash-250828',
    'doubao-seed-1-6-thinking-250715'
  ]

  /** Predefined Claude model list returned instead of querying an endpoint. */
  private static readonly CLAUDE_MODELS: readonly string[] = [
    'claude-3-5-sonnet-20241022',
    'claude-3-haiku-20240307',
    'claude-3-sonnet-20240229',
    'claude-3-opus-20240229'
  ]

  private services: Map<string, ModelService> = new Map()
  private static instance: ModelServiceManager

  /**
   * Returns the shared manager, creating it on first use and loading any
   * services saved in localStorage.
   */
  static getInstance(): ModelServiceManager {
    if (!ModelServiceManager.instance) {
      ModelServiceManager.instance = new ModelServiceManager()
      ModelServiceManager.instance.loadFromModelStore()
    }
    return ModelServiceManager.instance
  }

  /**
   * Loads provider configurations from the `model-providers` localStorage
   * entry and registers each as a ModelService.
   *
   * A provider is marked 'connected' when it is explicitly enabled or
   * connected, or when it is not explicitly disabled and has an API key.
   * Malformed storage content is logged and skipped; this method never throws.
   */
  loadFromModelStore(): void {
    try {
      const saved = localStorage.getItem('model-providers')
      if (!saved) {
        console.log('🔍 [loadFromModelStore] 没有找到保存的服务')
        return
      }
      const providers: unknown = JSON.parse(saved)
      if (!Array.isArray(providers)) {
        console.warn('⚠️ [loadFromModelStore] 保存的服务格式无效,已忽略')
        return
      }
      console.log('🔍 [loadFromModelStore] 加载服务:', providers.length, '个')
      for (const provider of providers as any[]) {
        // An entry without an id cannot be addressed later, so skip it.
        if (provider == null || typeof provider !== 'object' || provider.id == null) {
          console.warn('⚠️ [loadFromModelStore] 跳过无效的服务配置:', provider)
          continue
        }
        const isEnabled = provider.enabled === true || provider.connected === true
        const hasApiKey = typeof provider.apiKey === 'string' && provider.apiKey.length > 0
        const shouldConnect = isEnabled || (provider.enabled !== false && hasApiKey)

        // Stored models may be plain ids or objects carrying `id` / `name`.
        const modelList: string[] = Array.isArray(provider.models)
          ? provider.models
              .map((m: any) => (typeof m === 'string' ? m : m?.id || m?.name || ''))
              .filter((m: unknown) => typeof m === 'string' && m.length > 0)
          : []

        const service: ModelService = {
          id: provider.id,
          name: provider.name,
          type: this.mapProviderType(provider.type),
          url: provider.baseUrl || provider.url || '',
          apiKey: provider.apiKey || '',
          status: shouldConnect ? 'connected' : 'disconnected',
          models: modelList
        }
        this.services.set(service.id, service)
        console.log('🔍 [loadFromModelStore] 添加服务:', {
          name: service.name,
          enabled: provider.enabled,
          connected: provider.connected,
          hasApiKey,
          shouldConnect,
          status: service.status,
          模型数: service.models?.length,
          前3个模型: service.models?.slice(0, 3)
        })
      }
    } catch (error) {
      console.error('❌ [loadFromModelStore] 加载失败:', error)
    }
  }

  /**
   * Maps a saved provider type to a service type. Unknown types, including
   * names that only exist on Object.prototype, become 'custom'.
   */
  private mapProviderType(type: string): ModelService['type'] {
    const mapped = ModelServiceManager.PROVIDER_TYPES.get(type) ?? 'custom'
    console.log('🔍 [mapProviderType]', type, '→', mapped)
    return mapped
  }

  /**
   * Tests a service by fetching (or, for predefined lists, probing for) its
   * models.
   *
   * @returns success with the model list, or failure with the error message.
   */
  async testConnection(service: ModelService): Promise<ApiResponse<{ models: string[] }>> {
    try {
      const models = await this.fetchModels(service)
      return { success: true, data: { models } }
    } catch (error) {
      return {
        success: false,
        error: error instanceof Error ? error.message : '连接失败'
      }
    }
  }

  /**
   * Probes a service that has no model-list endpoint by sending a one-token
   * chat request. Any status other than 401/403 counts as reachable.
   *
   * Claude is probed at `/messages`; every other type at `/chat/completions`.
   *
   * @throws Error on authentication failure, timeout or network error.
   */
  private async testServiceConnection(service: ModelService): Promise<void> {
    const isClaude = service.type === 'claude'
    const path = isClaude ? '/messages' : '/chat/completions'
    let probeModel = 'test'
    if (isClaude) {
      probeModel = ModelServiceManager.CLAUDE_PROBE_MODEL
    } else if (service.type === 'volcengine') {
      probeModel = 'doubao-lite-4k'
    }
    const response = await this.fetchWithTimeout(
      `${this.baseUrl(service)}${path}`,
      {
        method: 'POST',
        headers: this.buildHeaders(service),
        body: JSON.stringify({
          model: probeModel,
          messages: [{ role: 'user', content: 'hi' }],
          max_tokens: 1
        })
      },
      ModelServiceManager.CONNECT_TIMEOUT_MS,
      '连接超时',
      '连接测试失败'
    )
    if (response.status === 401 || response.status === 403) {
      const errorText = await response.text()
      throw new Error(`认证失败: ${errorText}`)
    }
  }

  /**
   * Returns the model identifiers available on a service.
   *
   * Services without a model-list endpoint are probed for reachability and
   * answered from the predefined list.
   *
   * @throws Error on HTTP error status, timeout or network error.
   */
  private async fetchModels(service: ModelService): Promise<string[]> {
    const url = this.getModelsEndpoint(service)
    if (!url) {
      await this.testServiceConnection(service)
      return this.parseModelsResponse({}, service.type)
    }
    const response = await this.fetchWithTimeout(
      url,
      { method: 'GET', headers: this.buildHeaders(service) },
      ModelServiceManager.CONNECT_TIMEOUT_MS,
      '连接超时',
      '未知错误'
    )
    if (!response.ok) {
      const errorText = await response.text()
      throw new Error(`HTTP ${response.status}: ${errorText}`)
    }
    const data = await response.json()
    return this.parseModelsResponse(data, service.type)
  }

  /**
   * Returns the model-list URL for a service, or '' when the service uses a
   * predefined model list (Volcengine, Claude).
   */
  private getModelsEndpoint(service: ModelService): string {
    const base = this.baseUrl(service)
    switch (service.type) {
      case 'volcengine':
      case 'claude':
        return ''
      case 'gemini':
        // Gemini takes the API key as a query parameter.
        return `${base}/models?key=${encodeURIComponent(service.apiKey)}`
      case 'azure':
        return `${base}/openai/deployments?api-version=${ModelServiceManager.AZURE_API_VERSION}`
      default:
        return `${base}/models`
    }
  }

  /**
   * Extracts model identifiers from a provider's model-list response.
   *
   * @param data decoded JSON body; ignored for predefined lists.
   * @param type service type that produced the response.
   * @returns model ids, or an empty array when the shape is not recognised.
   */
  private parseModelsResponse(data: any, type: string): string[] {
    // Returns undefined when `list` is not an array so callers can fall through.
    const pick = (list: unknown, keys: string[], acceptStrings = false): string[] | undefined => {
      if (!Array.isArray(list)) return undefined
      const ids = list.map((entry: any) => {
        if (typeof entry === 'string') return acceptStrings ? entry : undefined
        for (const key of keys) {
          if (entry?.[key]) return entry[key]
        }
        return undefined
      })
      return ids.filter(Boolean)
    }

    const payload = data ?? {}
    switch (type) {
      case 'openai':
      case 'local':
      case 'azure':
        return pick(payload.data, ['id']) ?? []
      case 'dashscope':
        return (
          pick(payload.data, ['id', 'model_id']) ??
          pick(payload.models, ['id', 'model_id', 'name']) ??
          []
        )
      case 'volcengine':
        return [...ModelServiceManager.VOLCENGINE_MODELS]
      case 'claude':
        return [...ModelServiceManager.CLAUDE_MODELS]
      case 'gemini': {
        if (!Array.isArray(payload.models)) return []
        return payload.models
          .map((m: any) => (typeof m?.name === 'string' ? m.name.replace('models/', '') : undefined))
          .filter(Boolean)
      }
      case 'custom':
        // Try the common response shapes in turn.
        return (
          pick(payload.models, ['id', 'name'], true) ??
          pick(payload.data, ['id', 'name'], true) ??
          pick(payload, ['id', 'name'], true) ??
          []
        )
      default:
        return []
    }
  }

  /**
   * Sends a non-streaming chat request through a registered, connected service.
   *
   * @returns success with the provider's raw JSON response, or failure with
   *          an error message. Never throws.
   */
  async sendChatRequest(serviceId: string, messages: any[], model: string): Promise<ApiResponse<any>> {
    const startTime = performance.now()
    console.log('⏱️ [sendChatRequest] 开始请求', { serviceId, model, messages数量: messages.length })
    const service = this.services.get(serviceId)
    // Log a redacted copy so the API key never reaches the console.
    console.log(
      '🔍 [sendChatRequest] serviceId:',
      serviceId,
      'service:',
      service ? this.redactService(service) : service
    )
    if (!service || service.status !== 'connected') {
      return { success: false, error: '服务未连接' }
    }
    if (!service.url || !service.url.startsWith('http')) {
      console.error('❌ [sendChatRequest] 无效的服务URL:', service.url)
      return { success: false, error: `服务URL无效: ${service.url}` }
    }
    try {
      const beforeRequest = performance.now()
      console.log('⏱️ [sendChatRequest] 准备耗时:', (beforeRequest - startTime).toFixed(2), 'ms')
      const response = await this.makeChatRequest(service, messages, model)
      const afterRequest = performance.now()
      console.log('⏱️ [sendChatRequest] 请求耗时:', (afterRequest - beforeRequest).toFixed(2), 'ms')
      console.log('⏱️ [sendChatRequest] 总耗时:', (afterRequest - startTime).toFixed(2), 'ms')
      return { success: true, data: response }
    } catch (error) {
      console.error('❌ [sendChatRequest] 请求异常:', error)
      return {
        success: false,
        error: error instanceof Error ? error.message : '请求失败'
      }
    }
  }

  /**
   * Sends a streaming chat request through a registered, connected service.
   *
   * @param onChunk called with each text fragment as it arrives.
   * @param tools   optional tool definitions; forwarded only to the OpenAI,
   *                local, DashScope and Volcengine service types.
   * @returns success with any tool calls assembled from the stream, or
   *          failure with an error message. Never throws.
   */
  async sendChatRequestStream(
    serviceId: string,
    messages: any[],
    model: string,
    onChunk: (chunk: string) => void,
    tools?: any[]
  ): Promise<ApiResponse<{ toolCalls?: any[] }>> {
    const startTime = performance.now()
    console.log('🚀🚀🚀 [sendChatRequestStream] === 进入流式请求方法 ===')
    console.log('⏱️ [sendChatRequestStream] 开始流式请求', { serviceId, model, messages数量: messages.length })
    const service = this.services.get(serviceId)
    if (!service || service.status !== 'connected') {
      return { success: false, error: '服务未连接' }
    }
    if (!service.url || !service.url.startsWith('http')) {
      return { success: false, error: `服务URL无效: ${service.url}` }
    }
    try {
      const toolCalls = await this.makeChatRequestStream(service, messages, model, onChunk, tools)
      const endTime = performance.now()
      console.log('⏱️ [sendChatRequestStream] 流式请求完成,总耗时:', (endTime - startTime).toFixed(2), 'ms')
      return { success: true, data: { toolCalls } }
    } catch (error) {
      console.error('❌ [sendChatRequestStream] 流式请求异常:', error)
      return {
        success: false,
        error: error instanceof Error ? error.message : '流式请求失败'
      }
    }
  }

  /**
   * Performs the non-streaming chat HTTP call.
   *
   * @returns the provider's decoded JSON response.
   * @throws Error on HTTP error status, 30 s timeout or network error.
   */
  private async makeChatRequest(service: ModelService, messages: any[], model: string): Promise<any> {
    const requestStartTime = performance.now()
    console.log('🔍 [makeChatRequest] 服务信息:', {
      type: service.type,
      name: service.name,
      url: service.url,
      model
    })
    const { url, headers, body } = this.buildChatRequest(service, messages, model, false)
    const payload = JSON.stringify(body)
    const safeUrl = this.redactUrl(url)
    console.log('🔍 [makeChatRequest] 最终请求URL:', safeUrl)
    console.log('🔍 [makeChatRequest] 请求体大小:', payload.length, '字节')
    const beforeFetch = performance.now()
    console.log('⏱️ [makeChatRequest] 构建请求耗时:', (beforeFetch - requestStartTime).toFixed(2), 'ms')

    const response = await this.fetchWithTimeout(
      url,
      { method: 'POST', headers, body: payload },
      ModelServiceManager.CHAT_TIMEOUT_MS,
      '请求超时(30秒)',
      '请求失败'
    )
    const afterFetch = performance.now()
    console.log('⏱️ [makeChatRequest] 网络请求耗时:', (afterFetch - beforeFetch).toFixed(2), 'ms')
    console.log('🔍 [makeChatRequest] 响应状态:', response.status, response.statusText)
    if (!response.ok) {
      const errorText = await response.text()
      console.error('❌ [makeChatRequest] 请求失败:', {
        status: response.status,
        statusText: response.statusText,
        url: safeUrl,
        errorText
      })
      throw new Error(`HTTP ${response.status}: ${errorText}`)
    }
    const beforeParse = performance.now()
    const result = await response.json()
    const afterParse = performance.now()
    console.log('⏱️ [makeChatRequest] 解析响应耗时:', (afterParse - beforeParse).toFixed(2), 'ms')
    console.log('⏱️ [makeChatRequest] makeChatRequest总耗时:', (afterParse - requestStartTime).toFixed(2), 'ms')
    return result
  }

  /**
   * Performs the streaming chat HTTP call and feeds text fragments to
   * `onChunk` as server-sent events arrive.
   *
   * The request is aborted when no data arrives for 60 s, either before the
   * response headers or between two chunks of the body.
   *
   * @returns tool calls assembled from the stream, or undefined if none.
   * @throws Error on HTTP error status, idle timeout or network error.
   */
  private async makeChatRequestStream(
    service: ModelService,
    messages: any[],
    model: string,
    onChunk: (text: string) => void,
    tools?: any[]
  ): Promise<any[] | undefined> {
    const requestStartTime = performance.now()
    const { url, headers, body } = this.buildChatRequest(service, messages, model, true, tools)
    const payload = JSON.stringify(body)
    console.log('🔍 [makeChatRequestStream] 流式请求URL:', this.redactUrl(url))
    console.log('🔍 [makeChatRequestStream] 流式请求体大小:', payload.length, '字节')

    const controller = new AbortController()
    let timedOut = false
    const armIdleTimer = () =>
      setTimeout(() => {
        timedOut = true
        controller.abort()
      }, ModelServiceManager.STREAM_IDLE_TIMEOUT_MS)
    let idleTimer = armIdleTimer()

    try {
      const beforeFetch = performance.now()
      console.log('⏱️ [makeChatRequestStream] 构建请求耗时:', (beforeFetch - requestStartTime).toFixed(2), 'ms')
      const response = await fetch(url, {
        method: 'POST',
        headers,
        body: payload,
        signal: controller.signal
      })
      if (!response.ok) {
        const errorText = await response.text()
        throw new Error(`HTTP ${response.status}: ${errorText}`)
      }
      const afterFetch = performance.now()
      console.log('⏱️ [makeChatRequestStream] 首字节响应耗时:', (afterFetch - beforeFetch).toFixed(2), 'ms')

      const reader = response.body?.getReader()
      if (!reader) {
        throw new Error('无法获取响应流')
      }
      console.log('🌊🌊🌊 [makeChatRequestStream] === 开始读取流数据 ===')
      const decoder = new TextDecoder()
      const toolCallsMap = new Map<number, any>()
      let buffer = ''
      let chunkCount = 0
      let totalChars = 0
      const firstChunkTimeStart = performance.now()

      while (true) {
        const { done, value } = await reader.read()
        // Data (or end of stream) arrived: restart the idle countdown.
        clearTimeout(idleTimer)
        if (done) break
        idleTimer = armIdleTimer()

        chunkCount++
        if (chunkCount === 1) {
          console.log('⚡⚡⚡ [makeChatRequestStream] 收到第一个数据块!耗时:', (performance.now() - firstChunkTimeStart).toFixed(2), 'ms')
        }
        buffer += decoder.decode(value, { stream: true })
        const lines = buffer.split('\n')
        // The last element is an incomplete line; keep it for the next chunk.
        buffer = lines.pop() ?? ''
        for (const line of lines) {
          totalChars += this.consumeStreamLine(line, onChunk, toolCallsMap)
        }
      }

      // Flush the decoder and handle a final line that had no trailing newline.
      buffer += decoder.decode()
      if (buffer.trim() !== '') {
        totalChars += this.consumeStreamLine(buffer, onChunk, toolCallsMap)
      }

      const collectedToolCalls = Array.from(toolCallsMap.values())
      if (collectedToolCalls.length > 0) {
        console.log('🔧 [makeChatRequestStream] 检测到工具调用:', collectedToolCalls.length, '个')
      }
      const endTime = performance.now()
      console.log('⏱️ [makeChatRequestStream] 流式接收完成')
      console.log('⏱️ [makeChatRequestStream] 接收块数:', chunkCount, '总字符数:', totalChars)
      console.log('⏱️ [makeChatRequestStream] 流式总耗时:', (endTime - requestStartTime).toFixed(2), 'ms')
      return collectedToolCalls.length > 0 ? collectedToolCalls : undefined
    } catch (error) {
      if (timedOut || (error instanceof Error && error.name === 'AbortError')) {
        throw new Error('流式请求超时(60秒)')
      }
      throw error
    } finally {
      clearTimeout(idleTimer)
    }
  }

  /**
   * Handles one line of a server-sent-event stream: forwards any text it
   * carries to `onChunk` and merges tool-call fragments into `toolCalls`.
   *
   * Lines that are not `data:` lines, the `[DONE]` marker and unparseable
   * payloads are skipped.
   *
   * @returns number of text characters found on the line.
   */
  private consumeStreamLine(
    rawLine: string,
    onChunk: (text: string) => void,
    toolCalls: Map<number, any>
  ): number {
    const line = rawLine.trim()
    if (!line.startsWith('data:')) return 0
    const payload = line.slice('data:'.length).trim()
    if (payload === '' || payload === '[DONE]') return 0

    let data: any
    try {
      data = JSON.parse(payload)
    } catch (e) {
      // Best effort: one bad line must not abort the whole stream.
      console.warn('⚠️ [makeChatRequestStream] 无法解析的流数据行:', payload.slice(0, 200), e)
      return 0
    }

    const text = this.extractStreamText(data)
    if (text) {
      try {
        onChunk(text)
      } catch (e) {
        // A failing consumer callback is reported but does not stop the stream.
        console.error('❌ [makeChatRequestStream] onChunk 回调异常:', e)
      }
    }
    this.mergeToolCallDeltas(data?.choices?.[0]?.delta?.tool_calls, toolCalls)
    return text.length
  }

  /**
   * Pulls the text fragment out of one decoded stream event, supporting the
   * OpenAI-compatible, Claude and Gemini event shapes.
   *
   * @returns the fragment, or '' when the event carries no text.
   */
  private extractStreamText(data: any): string {
    // OpenAI-compatible: choices[0].delta.content
    const openAiText = data?.choices?.[0]?.delta?.content
    if (typeof openAiText === 'string') return openAiText
    // Claude: { type: 'content_block_delta', delta: { text } }
    if (data?.type === 'content_block_delta' && typeof data.delta?.text === 'string') {
      return data.delta.text
    }
    // Gemini: candidates[0].content.parts[].text
    const parts = data?.candidates?.[0]?.content?.parts
    if (Array.isArray(parts)) {
      return parts.map((p: any) => (typeof p?.text === 'string' ? p.text : '')).join('')
    }
    return ''
  }

  /**
   * Merges OpenAI-style streamed tool-call fragments into `toolCalls`, keyed
   * by each fragment's `index`. Argument strings are concatenated in arrival
   * order; id and name take the latest non-empty value.
   */
  private mergeToolCallDeltas(deltas: unknown, toolCalls: Map<number, any>): void {
    if (!Array.isArray(deltas)) return
    for (const delta of deltas as any[]) {
      if (!delta) continue
      const index: number = typeof delta.index === 'number' ? delta.index : 0
      let entry = toolCalls.get(index)
      if (!entry) {
        entry = {
          id: '',
          type: delta.type || 'function',
          function: { name: '', arguments: '' }
        }
        toolCalls.set(index, entry)
      }
      if (delta.id) entry.id = delta.id
      if (delta.function?.name) entry.function.name = delta.function.name
      if (delta.function?.arguments) entry.function.arguments += delta.function.arguments
    }
  }

  /**
   * Builds URL, headers and JSON body of a chat request for a service.
   *
   * @param stream whether to request a streamed response.
   * @param tools  tool definitions, forwarded only to the OpenAI, local,
   *               DashScope and Volcengine service types.
   */
  private buildChatRequest(
    service: ModelService,
    messages: any[],
    model: string,
    stream: boolean,
    tools?: any[]
  ): { url: string; headers: Record<string, string>; body: Record<string, unknown> } {
    const base = this.baseUrl(service)
    const headers = this.buildHeaders(service)
    switch (service.type) {
      case 'claude': {
        // Claude takes the system prompt as a top-level field, not a message.
        const system = this.extractSystemPrompt(messages)
        return {
          url: `${base}/messages`,
          headers,
          body: {
            model,
            messages: this.convertToClaudeFormat(messages),
            max_tokens: ModelServiceManager.CLAUDE_MAX_TOKENS,
            ...(system ? { system } : {}),
            ...(stream ? { stream: true } : {})
          }
        }
      }
      case 'gemini': {
        // Streaming uses a dedicated method; alt=sse selects SSE framing.
        const action = stream ? 'streamGenerateContent?alt=sse&' : 'generateContent?'
        return {
          url: `${base}/models/${model}:${action}key=${encodeURIComponent(service.apiKey)}`,
          headers,
          body: { contents: this.convertToGeminiFormat(messages) }
        }
      }
      case 'azure':
        return {
          url: `${base}/openai/deployments/${model}/chat/completions?api-version=${ModelServiceManager.AZURE_API_VERSION}`,
          headers,
          body: { messages, stream }
        }
      case 'openai':
      case 'local':
      case 'dashscope':
      case 'volcengine':
        return {
          url: `${base}/chat/completions`,
          headers,
          body: {
            model,
            messages,
            stream,
            ...(tools && tools.length > 0 ? { tools, tool_choice: 'auto' } : {})
          }
        }
      default:
        // 'custom' services are addressed as OpenAI-compatible, without tools.
        return {
          url: `${base}/chat/completions`,
          headers,
          body: { model, messages, stream }
        }
    }
  }

  /**
   * Builds request headers, including the service type's authentication.
   * Gemini gets none here because its key travels in the URL.
   */
  private buildHeaders(service: ModelService): Record<string, string> {
    const headers: Record<string, string> = {
      'Content-Type': 'application/json'
    }
    switch (service.type) {
      case 'openai':
      case 'local':
      case 'dashscope':
      case 'volcengine':
        headers['Authorization'] = `Bearer ${service.apiKey}`
        break
      case 'claude':
        headers['x-api-key'] = service.apiKey
        headers['anthropic-version'] = '2023-06-01'
        break
      case 'azure':
        headers['api-key'] = service.apiKey
        break
      case 'custom':
        try {
          const config = JSON.parse(service.customConfig || '{}')
          if (config && typeof config.headers === 'object') {
            Object.assign(headers, config.headers)
          }
        } catch (e) {
          console.warn('自定义配置解析失败:', e)
        }
        break
      default:
        break
    }
    return headers
  }

  /**
   * Runs `fetch` with an abort timer covering the time until the response
   * headers arrive.
   *
   * @param timeoutMessage  message of the Error thrown on timeout.
   * @param fallbackMessage message used if a non-Error value is thrown.
   */
  private async fetchWithTimeout(
    url: string,
    init: RequestInit,
    timeoutMs: number,
    timeoutMessage: string,
    fallbackMessage: string
  ): Promise<Response> {
    const controller = new AbortController()
    const timer = setTimeout(() => controller.abort(), timeoutMs)
    try {
      return await fetch(url, { ...init, signal: controller.signal })
    } catch (error) {
      if (error instanceof Error) {
        if (error.name === 'AbortError') {
          throw new Error(timeoutMessage)
        }
        throw error
      }
      throw new Error(fallbackMessage)
    } finally {
      clearTimeout(timer)
    }
  }

  /** Service base URL without trailing slashes, so paths join cleanly. */
  private baseUrl(service: ModelService): string {
    return (service.url || '').trim().replace(/\/+$/, '')
  }

  /** Masks a `key=` query parameter so URLs can be logged safely. */
  private redactUrl(url: string): string {
    return url.replace(/([?&]key=)[^&]*/g, '$1***')
  }

  /** Copy of a service with its credentials masked, for logging. */
  private redactService(service: ModelService): ModelService {
    return {
      ...service,
      apiKey: service.apiKey ? '***' : '',
      customConfig: service.customConfig ? '***' : service.customConfig
    }
  }

  /** Joins the string contents of all system messages, or '' if none. */
  private extractSystemPrompt(messages: any[]): string {
    return messages
      .filter(msg => msg?.role === 'system' && typeof msg.content === 'string' && msg.content.length > 0)
      .map(msg => msg.content as string)
      .join('\n\n')
  }

  /**
   * Converts chat messages to Claude's format: system messages are removed
   * and every non-assistant role becomes 'user'.
   */
  private convertToClaudeFormat(messages: any[]): any[] {
    return messages
      .filter(msg => msg.role !== 'system')
      .map(msg => ({
        role: msg.role === 'assistant' ? 'assistant' : 'user',
        content: msg.content
      }))
  }

  /**
   * Converts chat messages to Gemini's format: system messages are removed,
   * 'assistant' becomes 'model' and content is wrapped in a text part.
   */
  private convertToGeminiFormat(messages: any[]): any[] {
    return messages
      .filter(msg => msg.role !== 'system')
      .map(msg => ({
        role: msg.role === 'assistant' ? 'model' : 'user',
        parts: [{ text: msg.content }]
      }))
  }

  /** Registers a service under its id, replacing any existing entry. */
  addService(service: ModelService): void {
    this.services.set(service.id, service)
  }

  /** Replaces the registered service that has the same id. */
  updateService(service: ModelService): void {
    this.services.set(service.id, service)
  }

  /** Removes a service from the registry; unknown ids are ignored. */
  removeService(serviceId: string): void {
    this.services.delete(serviceId)
  }

  /** Returns the registered service with this id, if any. */
  getService(serviceId: string): ModelService | undefined {
    return this.services.get(serviceId)
  }

  /** Returns all registered services in insertion order. */
  getAllServices(): ModelService[] {
    return Array.from(this.services.values())
  }

  /**
   * Tests a registered service and records the outcome on it: 'connected'
   * with its model list, or 'error' with the failure message.
   *
   * @throws Error when the service is unknown or the connection test fails.
   */
  async connectService(serviceId: string): Promise<void> {
    const service = this.services.get(serviceId)
    if (!service) throw new Error('服务不存在')
    service.status = 'connecting'
    const result = await this.testConnection(service)
    if (result.success && result.data) {
      service.status = 'connected'
      service.models = result.data.models
      service.errorMessage = undefined
      service.lastUsed = new Date()
      return
    }
    const message = result.error || '连接失败'
    service.status = 'error'
    service.errorMessage = message
    throw new Error(message)
  }

  /** Marks a registered service disconnected and clears its models and error. */
  disconnectService(serviceId: string): void {
    const service = this.services.get(serviceId)
    if (service) {
      service.status = 'disconnected'
      service.models = []
      service.errorMessage = undefined
    }
  }

  /**
   * Checks one model by sending a minimal chat request.
   *
   * The request goes through `sendChatRequest`, which looks the service up
   * by `service.id`, so the service must be registered and connected.
   *
   * @returns availability, plus latency in ms on success or the error text.
   */
  async testModelHealth(service: ModelService, modelId: string): Promise<{
    modelId: string
    available: boolean
    latency?: number
    error?: string
  }> {
    const startTime = Date.now()
    const result = await this.sendChatRequest(
      service.id,
      [{ role: 'user', content: 'hi' }],
      modelId
    )
    if (!result.success) {
      return { modelId, available: false, error: result.error || '测试失败' }
    }
    return { modelId, available: true, latency: Date.now() - startTime }
  }

  /**
   * Checks every model of a service one after another, pausing 200 ms
   * between requests.
   *
   * @param onProgress called before each test with the 1-based position,
   *                   the total count and the model id.
   * @returns the per-model results plus the ids split by availability.
   */
  async healthCheckAllModels(
    service: ModelService,
    onProgress?: (current: number, total: number, modelId: string) => void
  ): Promise<{
    availableModels: string[]
    unavailableModels: string[]
    results: Array<{
      modelId: string
      available: boolean
      latency?: number
      error?: string
    }>
  }> {
    const models = service.models || []
    const results: Array<{
      modelId: string
      available: boolean
      latency?: number
      error?: string
    }> = []
    for (const [i, modelId] of models.entries()) {
      onProgress?.(i + 1, models.length, modelId)
      results.push(await this.testModelHealth(service, modelId))
      // Short pause between requests to avoid hammering the provider.
      if (i < models.length - 1) {
        await new Promise(resolve => setTimeout(resolve, 200))
      }
    }
    return {
      availableModels: results.filter(r => r.available).map(r => r.modelId),
      unavailableModels: results.filter(r => !r.available).map(r => r.modelId),
      results
    }
  }
}
// Shared singleton, created (and loaded from saved configuration) when this module is first imported.
export const modelServiceManager: ModelServiceManager = ModelServiceManager.getInstance()