2026-05-22 10:10:11 +08:00
|
|
|
import { Injectable, Logger } from '@nestjs/common';
|
2026-05-21 23:57:59 +08:00
|
|
|
import type { AiChatDto } from './dto/ai-chat.dto';
|
|
|
|
|
|
2026-05-22 00:20:34 +08:00
|
|
|
/**
 * Chat-completions endpoint of the Hermes agent.
 *
 * Can be overridden with the `HERMES_API_URL` environment variable; the
 * literal is kept as a fallback so existing deployments keep working.
 * `||` (not `??`) is deliberate: an empty environment variable is treated
 * the same as an unset one.
 */
const HERMES_API_URL =
  process.env.HERMES_API_URL || 'http://10.2.0.7:8642/v1/chat/completions';

/**
 * Bearer token sent in the `Authorization` header of Hermes requests.
 *
 * Can be overridden with the `HERMES_API_KEY` environment variable.
 * NOTE(review): the fallback literal is a credential committed to source
 * control — set the environment variable in every deployment, then remove
 * the fallback and rotate the key.
 */
const HERMES_API_KEY = process.env.HERMES_API_KEY || 'zhixi-hermes-key-2026';
|
|
|
|
|
|
2026-05-21 23:57:59 +08:00
|
|
|
/** Token counters read from the `usage` object of a Hermes response. */
interface HermesUsage {
  prompt_tokens?: number;
  completion_tokens?: number;
}

/**
 * The subset of the Hermes completion response that this service reads.
 *
 * NOTE(review): this shape is inferred from the property accesses in this
 * file (it looks like the OpenAI chat-completions format) — confirm against
 * the Hermes API before relying on any other field.
 */
interface HermesCompletionResponse {
  choices?: Array<{ message?: { content?: string | null } | null } | null> | null;
  usage?: HermesUsage | null;
}

/**
 * Forwards chat conversations to the Hermes chat-completions endpoint and
 * exposes the static connection details of the Hermes dashboard.
 */
@Injectable()
export class AdminAiChatService {
  /** Model identifier sent in the request body and echoed in the returned usage. */
  private static readonly MODEL = 'hermes-agent';

  /** Upper bound, in milliseconds, for a single Hermes request. */
  private static readonly TIMEOUT_MS = 120_000;

  private readonly logger = new Logger(AdminAiChatService.name);

  /**
   * Sends the conversation carried by `dto` to Hermes.
   *
   * @param dto Request DTO; only its `messages` are used.
   * @returns The assistant reply text and a token-usage summary.
   * @throws Error when Hermes answers with a non-2xx status. Errors raised by
   *   `fetch` itself (including the timeout abort) are rethrown unchanged.
   */
  async chat(dto: AiChatDto) {
    return this.callHermes(dto.messages);
  }

  /**
   * Performs one POST to the Hermes chat-completions endpoint.
   *
   * @param messages Conversation history, passed through to Hermes as-is.
   * @returns `content` — the text of the first choice, or `''` when the
   *   response carries none; `usage` — the model name plus the prompt and
   *   completion token counts exactly as reported (possibly `undefined`).
   * @throws Error with the upstream status and body when the response is not OK.
   */
  private async callHermes(messages: Array<{ role: string; content: string }>) {
    const startedAt = Date.now();

    try {
      const resp = await fetch(HERMES_API_URL, {
        method: 'POST',
        headers: {
          'Content-Type': 'application/json',
          Authorization: 'Bearer ' + HERMES_API_KEY,
        },
        body: JSON.stringify({
          model: AdminAiChatService.MODEL,
          messages,
          temperature: 0.7,
          max_tokens: 4096,
        }),
        // Abort the request instead of hanging when Hermes does not answer in time.
        signal: AbortSignal.timeout(AdminAiChatService.TIMEOUT_MS),
      });

      if (!resp.ok) {
        // Reading the body is best-effort: a failure here must not mask the status code.
        const text = await resp.text().catch(() => '');
        throw new Error(`Hermes API error ${resp.status}: ${text}`);
      }

      // The assertion is confined to this I/O boundary; every field is treated
      // as optional below, so a malformed or `null` payload degrades to an
      // empty reply instead of raising a TypeError.
      const payload = (await resp.json()) as HermesCompletionResponse | null;
      const content = payload?.choices?.[0]?.message?.content ?? '';
      const usage: HermesUsage = payload?.usage ?? {};

      const elapsedMs = Date.now() - startedAt;
      this.logger.log(
        `Hermes chat: ${elapsedMs}ms, tokens: ${usage.prompt_tokens ?? 0}/${usage.completion_tokens ?? 0}`,
      );

      return {
        content,
        usage: {
          model: AdminAiChatService.MODEL,
          inputTokens: usage.prompt_tokens,
          outputTokens: usage.completion_tokens,
        },
      };
    } catch (err: unknown) {
      // Successful calls are logged above; record failures (timeout, network,
      // non-2xx) as well, then rethrow the original error so callers observe
      // exactly the same exception as before.
      const reason = err instanceof Error ? `${err.name}: ${err.message}` : String(err);
      this.logger.error(`Hermes chat failed after ${Date.now() - startedAt}ms: ${reason}`);
      throw err;
    }
  }

  /**
   * Returns the static connection details of the Hermes dashboard.
   *
   * @returns The dashboard URL, the API base URL and a human-readable description.
   */
  getDashboardConfig() {
    return {
      url: 'http://10.2.0.7:9119',
      apiUrl: 'http://10.2.0.7:8642/v1',
      description: 'Hermes Agent Dashboard — 4核4G 上的 AI Agent',
    };
  }
}
|