181 lines
6.3 KiB
TypeScript
181 lines
6.3 KiB
TypeScript
import { createOpenAI } from '@ai-sdk/openai';
|
|
import { generateText as aiGenerateText, embed, stepCountIs } from 'ai';
|
|
import { AIProvider, TagSuggestion, TitleSuggestion, ToolUseOptions, ToolCallResult } from '../types';
|
|
import { cleanAIJsonResponse, cleanAITextResponse } from '../utils/clean-ai-response';
|
|
|
|
export class CustomOpenAIProvider implements AIProvider {
|
|
private model: any;
|
|
private embeddingModel: any;
|
|
private apiKey: string;
|
|
private baseUrl: string;
|
|
|
|
constructor(
|
|
apiKey: string,
|
|
baseUrl: string,
|
|
modelName: string = 'gpt-4o-mini',
|
|
embeddingModelName: string = 'text-embedding-3-small'
|
|
) {
|
|
this.apiKey = apiKey;
|
|
this.baseUrl = baseUrl.endsWith('/') ? baseUrl.slice(0, -1) : baseUrl;
|
|
// Create OpenAI-compatible client with custom base URL
|
|
// Use .chat() to force /chat/completions endpoint (avoids Responses API)
|
|
const customClient = createOpenAI({
|
|
baseURL: baseUrl,
|
|
apiKey: apiKey,
|
|
fetch: async (url, options) => {
|
|
const headers = new Headers(options?.headers);
|
|
headers.set('HTTP-Referer', 'https://localhost:3000');
|
|
headers.set('X-Title', 'Memento AI');
|
|
// Disable DeepSeek extended thinking for reliable tool/function calling
|
|
if (options?.body) {
|
|
try {
|
|
const body = JSON.parse(options.body as string)
|
|
if (
|
|
typeof body.model === 'string' &&
|
|
(body.model.includes('deepseek') || body.model.includes('thinking') || body.model.includes('reasoner'))
|
|
) {
|
|
body.thinking = { type: 'disabled' }
|
|
}
|
|
return fetch(url, { ...options, headers, body: JSON.stringify(body) })
|
|
} catch { /* ignore parse errors */ }
|
|
}
|
|
return fetch(url, { ...options, headers });
|
|
}
|
|
});
|
|
|
|
this.model = customClient.chat(modelName);
|
|
this.embeddingModel = customClient.embedding(embeddingModelName);
|
|
}
|
|
|
|
async generateTags(content: string): Promise<TagSuggestion[]> {
|
|
try {
|
|
const { text } = await aiGenerateText({
|
|
model: this.model,
|
|
prompt: `Analyze the following note and suggest 1 to 5 relevant tags.
|
|
Note content: "${content.substring(0, 1500)}"
|
|
Return ONLY a JSON array of tag objects, like: [{"tag":"example","confidence":0.9}]`,
|
|
});
|
|
|
|
const cleaned = cleanAIJsonResponse(text)
|
|
const parsed = JSON.parse(cleaned);
|
|
const arr = Array.isArray(parsed) ? parsed : (parsed.tags || parsed.suggestions || []);
|
|
return arr.map((t: any) => ({
|
|
tag: t.tag || t.label || t.name || '',
|
|
confidence: t.confidence || t.score || 0.7,
|
|
}));
|
|
} catch (e) {
|
|
console.error('Error generating tags (Custom OpenAI):', e);
|
|
return [];
|
|
}
|
|
}
|
|
|
|
async getEmbeddings(text: string): Promise<number[]> {
|
|
try {
|
|
const { embedding } = await embed({
|
|
model: this.embeddingModel,
|
|
value: text,
|
|
});
|
|
return embedding;
|
|
} catch (e) {
|
|
console.error('Error generating embeddings (Custom OpenAI):', e);
|
|
throw e;
|
|
}
|
|
}
|
|
|
|
async generateTitles(prompt: string): Promise<TitleSuggestion[]> {
|
|
try {
|
|
// Use generateText instead of generateObject — DeepSeek/MiniMax don't support
|
|
// response_format: json_schema via the OpenAI compat layer
|
|
const { text } = await aiGenerateText({
|
|
model: this.model,
|
|
prompt: prompt,
|
|
})
|
|
|
|
const cleaned = cleanAIJsonResponse(text)
|
|
const parsed = JSON.parse(cleaned)
|
|
const titles = Array.isArray(parsed) ? parsed : (parsed.titles || parsed.suggestions || [])
|
|
return titles.map((t: any) => ({
|
|
title: typeof t === 'string' ? t : t.title || t.name || '',
|
|
confidence: typeof t === 'number' ? t : (t.confidence || t.score || 0.5),
|
|
}))
|
|
} catch (e) {
|
|
console.error('Error generating titles (Custom OpenAI):', e)
|
|
return []
|
|
}
|
|
}
|
|
|
|
|
|
|
|
async generateText(prompt: string): Promise<string> {
|
|
try {
|
|
const { text } = await aiGenerateText({
|
|
model: this.model,
|
|
prompt: prompt,
|
|
});
|
|
|
|
return cleanAITextResponse(text).trim();
|
|
} catch (e) {
|
|
console.error('Error generating text (Custom OpenAI):', e);
|
|
throw e;
|
|
}
|
|
}
|
|
|
|
async chat(messages: any[], systemPrompt?: string): Promise<any> {
|
|
try {
|
|
const { text } = await aiGenerateText({
|
|
model: this.model,
|
|
system: systemPrompt,
|
|
messages: messages,
|
|
});
|
|
|
|
return { text: text.trim() };
|
|
} catch (e) {
|
|
console.error('Error in chat (Custom OpenAI):', e);
|
|
throw e;
|
|
}
|
|
}
|
|
|
|
async generateWithTools(options: ToolUseOptions): Promise<ToolCallResult> {
|
|
const { tools, maxSteps = 10, systemPrompt, messages, prompt } = options
|
|
|
|
const buildOpts = (steps: number): Record<string, any> => {
|
|
const opts: Record<string, any> = { model: this.model, tools, stopWhen: stepCountIs(steps) }
|
|
if (systemPrompt) opts.system = systemPrompt
|
|
if (messages) opts.messages = messages
|
|
else if (prompt) opts.prompt = prompt
|
|
return opts
|
|
}
|
|
|
|
const toResult = (r: any): ToolCallResult => ({
|
|
toolCalls: r.toolCalls?.map((tc: any) => ({ toolName: tc.toolName, input: tc.input })) || [],
|
|
toolResults: r.toolResults?.map((tr: any) => ({ toolName: tr.toolName, input: tr.input, output: tr.output })) || [],
|
|
text: r.text,
|
|
steps: r.steps?.map((step: any) => ({
|
|
text: step.text,
|
|
toolCalls: step.toolCalls?.map((tc: any) => ({ toolName: tc.toolName, input: tc.input })) || [],
|
|
toolResults: step.toolResults?.map((tr: any) => ({ toolName: tr.toolName, input: tr.input, output: tr.output })) || [],
|
|
})) || [],
|
|
})
|
|
|
|
try {
|
|
const result = await aiGenerateText(buildOpts(maxSteps) as any)
|
|
return toResult(result)
|
|
} catch (err: any) {
|
|
// DeepSeek reasoning/thinking models require reasoning_content to be passed back
|
|
// between multi-step calls, which the AI SDK doesn't handle via the OpenAI-compat layer.
|
|
// Retry with a single step so the model calls the tool directly.
|
|
const msg: string = err?.message || String(err)
|
|
if (msg.includes('reasoning_content') || msg.includes('thinking mode')) {
|
|
console.warn('[CustomOpenAI] Reasoning model detected — retrying with maxSteps=1')
|
|
const result = await aiGenerateText(buildOpts(1) as any)
|
|
return toResult(result)
|
|
}
|
|
throw err
|
|
}
|
|
}
|
|
|
|
getModel() {
|
|
return this.model;
|
|
}
|
|
}
|