forked from CherryHQ/cherry-studio-app
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathModelHealthService.ts
More file actions
114 lines (97 loc) · 3.2 KB
/
ModelHealthService.ts
File metadata and controls
114 lines (97 loc) · 3.2 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
import type { Model, ModelHealth, Provider } from '@/types/assistant'
import { checkApi } from './ApiService'
import { loggerService } from './LoggerService'
const logger = loggerService.withContext('ModelHealthService')
export type ModelHealthCheckResult = ModelHealth
function extractErrorMessage(error: unknown): string {
let errorMessage = 'Unknown error'
if (error instanceof Error) {
errorMessage = error.message
if ((error as any).status) {
errorMessage = `HTTP ${(error as any).status}: ${errorMessage}`
}
} else if (typeof error === 'string') {
errorMessage = error
}
return errorMessage
}
/**
* Check health of a single model
* @param provider Provider to test
* @param model Model to test
* @param timeoutMs Timeout in milliseconds (default: 30000)
* @returns ModelHealth result
*/
export async function checkModelHealth(
provider: Provider,
model: Model,
timeoutMs: number = 30000
): Promise<ModelHealth> {
const startTime = Date.now()
try {
// Create a timeout promise
const timeoutPromise = new Promise<never>((_, reject) => {
setTimeout(() => reject(new Error('Health check timeout')), timeoutMs)
})
// Race between the actual check and timeout
await Promise.race([checkApi(provider, model), timeoutPromise])
const endTime = Date.now()
const latency = (endTime - startTime) / 1000 // Convert to seconds
return {
modelId: model.id,
status: 'healthy',
latency,
lastChecked: Date.now()
}
} catch (error) {
const endTime = Date.now()
const latency = (endTime - startTime) / 1000
logger.error(`Health check failed for model ${model.id}:`, error as Error)
// Extract meaningful error message
const errorMessage = extractErrorMessage(error)
return {
modelId: model.id,
status: 'unhealthy',
latency,
lastChecked: Date.now(),
error: errorMessage
}
}
}
/**
* Check health of multiple models in parallel
* @param provider Provider to test
* @param models Models to test
* @param timeoutMs Timeout in milliseconds for each model (default: 30000)
* @returns Array of ModelHealth results
*/
export async function checkModelsHealth(
provider: Provider,
models: Model[],
timeoutMs: number = 30000
): Promise<ModelHealth[]> {
logger.info(`Starting health check for ${models.length} models`)
// Create promises for all model checks
const checkPromises = models.map(model => checkModelHealth(provider, model, timeoutMs))
// Wait for all checks to complete (using allSettled to handle individual failures)
const results = await Promise.allSettled(checkPromises)
// Extract successful results and handle failures
return results.map((result, index) => {
if (result.status === 'fulfilled') {
return result.value
} else {
// If the check itself failed (not the API call), return an unhealthy status
logger.error(`Failed to check health for model ${models[index].id}:`, result.reason)
return {
modelId: models[index].id,
status: 'unhealthy',
lastChecked: Date.now(),
error: extractErrorMessage(result.reason)
}
}
})
}
export const modelHealthService = {
checkModelHealth,
checkModelsHealth
}