2026-04-29 16:26:24 +08:00
|
|
|
import { io, type Socket } from 'socket.io-client'
|
2026-04-16 08:38:18 +08:00
|
|
|
import { request, getBaseUrlValue, getApiKey } from '../client'
|
2026-04-11 15:59:14 +08:00
|
|
|
|
|
|
|
|
/**
 * One turn of a conversation, as accepted in `StartRunRequest.input`
 * when the input is given as a message list rather than a plain string.
 */
export interface ChatMessage {
  /** Who produced this turn. */
  role: 'user' | 'assistant' | 'system'
  /** Text of the turn. */
  content: string
}
|
|
|
|
|
|
|
|
|
|
/**
 * Request body for starting a run. `startRunViaSocket` emits this object
 * unchanged as the payload of the `run` Socket.IO event.
 */
export interface StartRunRequest {
  /** The prompt: either a single string or a list of chat messages. */
  input: string | ChatMessage[]
  /** Optional extra instructions for the run (presumably a system-style prompt — confirm against the server). */
  instructions?: string
  /**
   * Session this run belongs to. When set, `startRunViaSocket` uses it to
   * drop events tagged with a different session and sends it with `abort`.
   */
  session_id?: string
  /** Optional model identifier (presumably one of the ids returned by `fetchModels` — confirm). */
  model?: string
}
|
|
|
|
|
|
|
|
|
|
/**
 * Shape of a "run started" response: the new run's identifier plus a status
 * string. Not referenced by the Socket.IO code visible in this file.
 */
export interface StartRunResponse {
  /** Identifier of the run. */
  run_id: string
  /** Status label for the run; the set of possible values is not defined here. */
  status: string
}
|
|
|
|
|
|
|
|
|
|
// SSE event types from /v1/runs/{id}/events
/**
 * Payload of a single run event. The same shape is what the Socket.IO
 * listeners in `startRunViaSocket` receive and forward to `onEvent`.
 * Every field except `event` is optional; which ones are populated depends
 * on the event type.
 */
export interface RunEvent {
  /**
   * Event name. `startRunViaSocket` treats `run.completed` and `run.failed`
   * as terminal.
   */
  event: string
  /** Run identifier; passed to `onStarted` when a `run.started` event arrives. */
  run_id?: string
  /** Incremental chunk (presumably the text of a `message.delta` event — confirm). */
  delta?: string
  /** Payload text for `reasoning.delta` / `thinking.delta` / `reasoning.available` events. */
  text?: string
  /** Tool identifier (presumably set on `tool.*` events — confirm). */
  tool?: string
  /** Name associated with the event (presumably the tool's display name — confirm). */
  name?: string
  /** Short preview string (presumably of tool input/output — confirm). */
  preview?: string
  /** Event time as a number; the unit (seconds vs. milliseconds) is not established here. */
  timestamp?: number
  /** Error description; used as the `Error` message when `run.failed` is handled. */
  error?: string
  /** Final response text on `run.completed`. May be empty/null if the agent
   * silently swallowed an upstream error — see chat store for fallback. */
  output?: string | null
  /** Token accounting attached to the event. */
  usage?: {
    input_tokens: number
    output_tokens: number
    total_tokens: number
  }
  /** session_id tag added by server for client-side filtering */
  session_id?: string
}
|
|
|
|
|
|
|
|
|
|
// ============================
|
|
|
|
|
// Socket.IO chat run connection
|
|
|
|
|
// ============================
|
|
|
|
|
|
|
|
|
|
/**
 * Module-wide shared socket for the chat-run namespace. `null` until
 * `connectChatRun()` creates one, and again after `disconnectChatRun()`.
 */
let chatRunSocket: Socket | null = null

/**
 * Peek at the shared chat-run socket without creating or connecting one.
 *
 * @returns The current socket, or `null` when none exists.
 */
export function getChatRunSocket(): Socket | null {
  return chatRunSocket
}
|
|
|
|
|
|
2026-04-29 16:26:24 +08:00
|
|
|
/**
 * Base URL / token / profile the current `chatRunSocket` was created with.
 * Used to decide whether a socket that is still (re)connecting may be reused.
 */
let chatRunSocketConfigKey: string | null = null

/**
 * Return the shared Socket.IO connection for the `/chat-run` namespace,
 * creating it when necessary.
 *
 * Reuse rules:
 * - A connected socket is always reused.
 * - A socket that is not connected but still `active` (initial connection in
 *   progress, or automatic reconnection after a transport failure) is reused
 *   as long as the base URL, token and profile are unchanged. Tearing such a
 *   socket down would call `removeAllListeners()` on it and silently drop the
 *   listeners and pending emits of every in-flight run or resume that shares it.
 * - Anything else (manually disconnected, rejected by the server, or created
 *   with stale settings) is stripped of its listeners, disconnected and replaced.
 *
 * @returns The shared socket (possibly not connected yet).
 */
export function connectChatRun(): Socket {
  if (chatRunSocket?.connected) return chatRunSocket

  const baseUrl = getBaseUrlValue()
  const token = getApiKey()
  const profile = localStorage.getItem('hermes_active_profile_name') || 'default'
  const configKey = JSON.stringify([baseUrl, token, profile])

  // Still connecting / auto-reconnecting with the same settings: keep it so
  // listeners registered by other callers survive.
  if (chatRunSocket?.active && chatRunSocketConfigKey === configKey) {
    return chatRunSocket
  }

  // Clean up old socket to prevent duplicate event listeners
  if (chatRunSocket) {
    chatRunSocket.removeAllListeners()
    chatRunSocket.disconnect()
  }

  chatRunSocket = io(`${baseUrl}/chat-run`, {
    auth: { token },
    query: { profile },
    transports: ['websocket', 'polling'],
    reconnection: true,
    reconnectionAttempts: Infinity,
    reconnectionDelay: 1000,
    reconnectionDelayMax: 10000,
  })
  chatRunSocketConfigKey = configKey

  return chatRunSocket
}
|
|
|
|
|
|
|
|
|
|
/**
 * Close the shared chat-run socket, if there is one, and forget it so the
 * next `connectChatRun()` call builds a fresh connection.
 */
export function disconnectChatRun(): void {
  const current = chatRunSocket
  if (!current) return

  // Disconnect first, then clear the module-level reference.
  current.disconnect()
  chatRunSocket = null
}
|
|
|
|
|
|
|
|
|
|
/*
 * Note: `startRunViaSocket` (defined further below) starts a chat run via
 * Socket.IO and streams events back. It returns a handle exposing an
 * `abort()` method for cancellation.
 */
|
|
|
|
|
/**
 * Ask the server to resume a session over the shared Socket.IO connection.
 *
 * A one-shot `resumed` listener is registered before the `resume` request is
 * emitted; its payload (messages, working status, events and optional token
 * counts) is handed to `onResumed`.
 *
 * @param sessionId - Session to resume; sent as `session_id`.
 * @param onResumed - Invoked with the payload of the next `resumed` event.
 * @returns The shared socket the request was sent on.
 */
export function resumeSession(
  sessionId: string,
  onResumed: (data: { session_id: string; messages: any[]; isWorking: boolean; events: any[]; inputTokens?: number; outputTokens?: number }) => void,
): Socket {
  const chatSocket = connectChatRun()
  const resumeRequest = { session_id: sessionId }

  chatSocket.once('resumed', onResumed)
  chatSocket.emit('resume', resumeRequest)

  return chatSocket
}
|
|
|
|
|
|
2026-04-29 16:26:24 +08:00
|
|
|
/**
 * Start a chat run over the shared Socket.IO connection and stream its events
 * back to the caller.
 *
 * Listeners for all run-related events are attached to the socket returned by
 * `connectChatRun()`, then `body` is emitted as a `run` event. The listeners
 * are detached again when a terminal event (`run.completed` / `run.failed`)
 * is accepted or when the returned handle's `abort()` is called.
 *
 * @param body - Run request. `body.session_id`, when set, is used to filter
 *   incoming events and is sent along with `abort`.
 * @param onEvent - Called for every accepted event.
 * @param onDone - Called once, after an accepted terminal event has been
 *   passed to `onEvent` (also when `onEvent` throws). Not called by `abort()`.
 * @param onError - Called after `onDone` when an accepted `run.failed`
 *   arrives; the message is the event's `error` or `'Run failed'`.
 * @param onStarted - Called with the event's `run_id` (or `''`) when an
 *   accepted `run.started` arrives.
 * @returns A handle whose `abort()` emits `abort` for the session and
 *   detaches the listeners; it is a no-op once the run has finished.
 */
export function startRunViaSocket(
  body: StartRunRequest,
  onEvent: (event: RunEvent) => void,
  onDone: () => void,
  onError: (err: Error) => void,
  onStarted?: (runId: string) => void,
): { abort: () => void } {
  const socket = connectChatRun()
  let closed = false

  // IMPORTANT: The Socket.IO connection is shared across all in-flight runs
  // (single namespace, single socket). When two sessions run concurrently,
  // every `startRunViaSocket()` call registers its own listeners on the SAME
  // socket, so each event fans out to every run's listeners. The server tags
  // payloads with `session_id`; we filter here so each run only sees its own
  // events. Events without a `session_id` tag are always accepted (backwards
  // compatibility), and nothing is filtered when the request itself carried
  // no `session_id`.
  const expectedSid = body.session_id

  /**
   * Forward one event to the caller.
   * Returns `true` when the event was accepted, `false` when it was ignored
   * (run already closed, or event tagged for a different session).
   */
  const handleEvent = (event: RunEvent): boolean => {
    if (closed) return false
    if (expectedSid && event.session_id && event.session_id !== expectedSid) {
      return false
    }
    try {
      onEvent(event)
    } finally {
      // Terminal events always release the listeners, even if onEvent threw.
      if (event.event === 'run.completed' || event.event === 'run.failed') {
        cleanup()
        onDone()
      }
    }
    return true
  }

  // Only notify the caller for events that actually belong to this run;
  // otherwise another session's start/failure would be reported here.
  const onRunStarted = (data: RunEvent): void => {
    if (handleEvent(data)) onStarted?.(data.run_id || '')
  }
  const onRunFailed = (data: RunEvent): void => {
    if (handleEvent(data)) onError?.(new Error(data.error || 'Run failed'))
  }
  const forward = (data: RunEvent): void => {
    handleEvent(data)
  }

  // Single source of truth for registration AND removal, so the two can never
  // drift apart (a mismatched handler in `off()` leaves the listener attached).
  const listeners: ReadonlyArray<readonly [string, (data: RunEvent) => void]> = [
    ['run.started', onRunStarted],
    ['run.failed', onRunFailed],
    ['message.delta', forward],
    ['reasoning.delta', forward],
    ['thinking.delta', forward],
    ['reasoning.available', forward],
    ['tool.started', forward],
    ['tool.completed', forward],
    ['run.completed', forward],
    ['compression.started', forward],
    ['compression.completed', forward],
    ['usage.updated', forward],
  ]

  /** Detach every listener this call registered; safe to call repeatedly. */
  function cleanup(): void {
    if (closed) return
    closed = true
    for (const [eventName, listener] of listeners) {
      socket.off(eventName, listener)
    }
  }

  for (const [eventName, listener] of listeners) {
    socket.on(eventName, listener)
  }

  // Emit the run request. No ack callback is used: the run id is delivered
  // later through the `run.started` event.
  socket.emit('run', body)

  return {
    abort: () => {
      if (!closed) {
        socket.emit('abort', { session_id: body.session_id })
        cleanup()
      }
    },
  }
}
|
|
|
|
|
|
|
|
|
|
/**
 * Retrieve the list of available models by calling the shared `request`
 * helper with the models endpoint.
 *
 * @returns A promise for an object whose `data` array holds one `{ id }`
 *   entry per model (per the declared return type).
 */
export async function fetchModels(): Promise<{ data: Array<{ id: string }> }> {
  const modelsEndpoint = '/api/hermes/v1/models'
  return request(modelsEndpoint)
}
|