// Momento/memento-note/lib/ai/providers/custom-openai.ts

import { createOpenAI } from '@ai-sdk/openai';
import { generateText as aiGenerateText, embed, stepCountIs } from 'ai';
import { AIProvider, TagSuggestion, TitleSuggestion, ToolUseOptions, ToolCallResult } from '../types';
import { cleanAIJsonResponse, cleanAITextResponse } from '../utils/clean-ai-response';

/**
 * AI provider that talks to an OpenAI-compatible HTTP endpoint through the
 * AI SDK's OpenAI client, using a caller-supplied base URL and API key.
 *
 * Chat requests go through the `/chat/completions` style model (`.chat()`),
 * and every outgoing request is decorated with identification headers. For
 * models whose name contains `deepseek`, `thinking` or `reasoner`, the request
 * body is rewritten to carry `thinking: { type: 'disabled' }`.
 */
export class CustomOpenAIProvider implements AIProvider {
  private model: any;
  private embeddingModel: any;
  private apiKey: string;
  private baseUrl: string;

  /**
   * @param apiKey API key forwarded to the OpenAI-compatible client.
   * @param baseUrl Endpoint base URL; a single trailing slash is removed.
   * @param modelName Chat model identifier (defaults to `gpt-4o-mini`).
   * @param embeddingModelName Embedding model identifier
   *   (defaults to `text-embedding-3-small`).
   */
  constructor(
    apiKey: string,
    baseUrl: string,
    modelName: string = 'gpt-4o-mini',
    embeddingModelName: string = 'text-embedding-3-small'
  ) {
    this.apiKey = apiKey;
    this.baseUrl = baseUrl.endsWith('/') ? baseUrl.slice(0, -1) : baseUrl;

    // Create OpenAI-compatible client with custom base URL.
    // The normalized URL is used so the stored value and the client agree.
    const customClient = createOpenAI({
      baseURL: this.baseUrl,
      apiKey,
      fetch: async (url, options) => {
        const headers = new Headers(options?.headers);
        headers.set('HTTP-Referer', 'https://localhost:3000');
        headers.set('X-Title', 'Memento AI');
        // Disable DeepSeek extended thinking for reliable tool/function calling.
        const body = CustomOpenAIProvider.withThinkingDisabled(options?.body);
        return fetch(url, { ...options, headers, body });
      },
    });

    // Use .chat() to force /chat/completions endpoint (avoids Responses API).
    this.model = customClient.chat(modelName);
    this.embeddingModel = customClient.embedding(embeddingModelName);
  }

  /**
   * Returns the request body with `thinking: { type: 'disabled' }` added when
   * it is a JSON object whose `model` name mentions `deepseek`, `thinking` or
   * `reasoner`. Any other body (non-string, unparsable, non-object, or a
   * non-matching model) is returned untouched.
   */
  private static withThinkingDisabled(
    body: BodyInit | null | undefined
  ): BodyInit | null | undefined {
    if (typeof body !== 'string') return body;

    let payload: unknown;
    try {
      payload = JSON.parse(body);
    } catch {
      // Not JSON: forward the request exactly as the SDK built it.
      return body;
    }
    if (typeof payload !== 'object' || payload === null) return body;

    const modelId = (payload as { model?: unknown }).model;
    if (typeof modelId !== 'string') return body;

    const markers = ['deepseek', 'thinking', 'reasoner'];
    if (!markers.some((marker) => modelId.includes(marker))) return body;

    return JSON.stringify({ ...payload, thinking: { type: 'disabled' } });
  }

  /**
   * Extracts the list of suggestions from a parsed model response: either the
   * response itself when it is an array, or the first of `keys` that holds an
   * array. Returns an empty list when nothing matches.
   */
  private static extractList(parsed: unknown, keys: readonly string[]): unknown[] {
    if (Array.isArray(parsed)) return parsed;
    if (typeof parsed !== 'object' || parsed === null) return [];

    const record = parsed as Record<string, unknown>;
    for (const key of keys) {
      const value = record[key];
      if (Array.isArray(value)) return value;
    }
    return [];
  }

  /** Returns the first candidate that is a non-empty string or finite number (as text), else `''`. */
  private static firstText(...candidates: unknown[]): string {
    for (const candidate of candidates) {
      if (typeof candidate === 'string' && candidate !== '') return candidate;
      if (typeof candidate === 'number' && Number.isFinite(candidate)) return String(candidate);
    }
    return '';
  }

  /** Returns the first candidate that is a finite number (including `0`), else `fallback`. */
  private static firstNumber(fallback: number, ...candidates: unknown[]): number {
    for (const candidate of candidates) {
      if (typeof candidate === 'number' && Number.isFinite(candidate)) return candidate;
    }
    return fallback;
  }

  /**
   * Asks the model for 1 to 5 tags describing a note.
   *
   * Only the first 1500 characters of `content` are sent. Malformed entries in
   * the model's answer are skipped instead of invalidating the whole answer,
   * and a confidence of `0` is preserved rather than replaced by the default.
   *
   * @param content Note text to analyze.
   * @returns Tag suggestions (confidence defaults to 0.7); an empty array when
   *   the request or the parsing fails.
   */
  async generateTags(content: string): Promise<TagSuggestion[]> {
    try {
      const { text } = await aiGenerateText({
        model: this.model,
        prompt: `Analyze the following note and suggest 1 to 5 relevant tags.
Note content: "${content.substring(0, 1500)}"
Return ONLY a JSON array of tag objects, like: [{"tag":"example","confidence":0.9}]`,
      });

      const parsed: unknown = JSON.parse(cleanAIJsonResponse(text));
      const entries = CustomOpenAIProvider.extractList(parsed, ['tags', 'suggestions']);

      return entries.flatMap((entry): TagSuggestion[] => {
        if (typeof entry !== 'object' || entry === null) return [];
        const fields = entry as Record<string, unknown>;
        const tag = CustomOpenAIProvider.firstText(fields.tag, fields.label, fields.name);
        // A suggestion without a name is useless to callers; drop it.
        if (tag === '') return [];
        const confidence = CustomOpenAIProvider.firstNumber(0.7, fields.confidence, fields.score);
        return [{ tag, confidence }];
      });
    } catch (e) {
      console.error('Error generating tags (Custom OpenAI):', e);
      return [];
    }
  }

  /**
   * Computes an embedding vector for `text` with the configured embedding model.
   *
   * @throws Rethrows any error from the embedding call after logging it.
   */
  async getEmbeddings(text: string): Promise<number[]> {
    try {
      const { embedding } = await embed({
        model: this.embeddingModel,
        value: text,
      });
      return embedding;
    } catch (e) {
      console.error('Error generating embeddings (Custom OpenAI):', e);
      throw e;
    }
  }

  /**
   * Sends `prompt` to the model and parses the answer as a list of titles.
   *
   * The answer may be a JSON array or an object with a `titles` or
   * `suggestions` array; entries may be plain strings or objects with
   * `title`/`name` and `confidence`/`score`. Entries without a usable title
   * are skipped, and a confidence of `0` is preserved.
   *
   * @param prompt Fully built prompt asking for title suggestions.
   * @returns Title suggestions (confidence defaults to 0.5); an empty array
   *   when the request or the parsing fails.
   */
  async generateTitles(prompt: string): Promise<TitleSuggestion[]> {
    try {
      // Use generateText instead of generateObject — DeepSeek/MiniMax don't support
      // response_format: json_schema via the OpenAI compat layer
      const { text } = await aiGenerateText({
        model: this.model,
        prompt: prompt,
      });

      const parsed: unknown = JSON.parse(cleanAIJsonResponse(text));
      const entries = CustomOpenAIProvider.extractList(parsed, ['titles', 'suggestions']);

      return entries.flatMap((entry): TitleSuggestion[] => {
        if (typeof entry === 'string') {
          return entry === '' ? [] : [{ title: entry, confidence: 0.5 }];
        }
        if (typeof entry !== 'object' || entry === null) return [];
        const fields = entry as Record<string, unknown>;
        const title = CustomOpenAIProvider.firstText(fields.title, fields.name);
        if (title === '') return [];
        const confidence = CustomOpenAIProvider.firstNumber(0.5, fields.confidence, fields.score);
        return [{ title, confidence }];
      });
    } catch (e) {
      console.error('Error generating titles (Custom OpenAI):', e);
      return [];
    }
  }

  /**
   * Runs a single-prompt completion and returns the cleaned, trimmed text.
   *
   * @throws Rethrows any error from the completion call after logging it.
   */
  async generateText(prompt: string): Promise<string> {
    try {
      const { text } = await aiGenerateText({
        model: this.model,
        prompt: prompt,
      });

      return cleanAITextResponse(text).trim();
    } catch (e) {
      console.error('Error generating text (Custom OpenAI):', e);
      throw e;
    }
  }

  /**
   * Runs a chat completion over `messages` with an optional system prompt.
   *
   * @returns An object `{ text }` holding the trimmed model reply.
   * @throws Rethrows any error from the completion call after logging it.
   */
  async chat(messages: any[], systemPrompt?: string): Promise<any> {
    try {
      const { text } = await aiGenerateText({
        model: this.model,
        system: systemPrompt,
        messages: messages,
      });

      return { text: text.trim() };
    } catch (e) {
      console.error('Error in chat (Custom OpenAI):', e);
      throw e;
    }
  }

  /**
   * Runs a tool-enabled generation, allowing up to `maxSteps` (default 10)
   * model steps, and flattens the SDK result into a `ToolCallResult`.
   *
   * `messages` takes precedence over `prompt` when both are supplied. If the
   * call fails with an error mentioning `reasoning_content` or `thinking mode`,
   * it is retried once with a single step.
   *
   * @throws Rethrows any other error, and any error raised by the retry.
   */
  async generateWithTools(options: ToolUseOptions): Promise<ToolCallResult> {
    const { tools, maxSteps = 10, systemPrompt, messages, prompt } = options;

    const buildOpts = (steps: number): Record<string, any> => {
      const opts: Record<string, any> = { model: this.model, tools, stopWhen: stepCountIs(steps) };
      if (systemPrompt) opts.system = systemPrompt;
      if (messages) opts.messages = messages;
      else if (prompt) opts.prompt = prompt;
      return opts;
    };

    // Keep only the fields callers consume from each tool call / tool result.
    const mapCalls = (calls: any): { toolName: any; input: any }[] =>
      calls?.map((tc: any) => ({ toolName: tc.toolName, input: tc.input })) || [];
    const mapResults = (results: any): { toolName: any; input: any; output: any }[] =>
      results?.map((tr: any) => ({ toolName: tr.toolName, input: tr.input, output: tr.output })) || [];

    const toResult = (r: any): ToolCallResult => ({
      toolCalls: mapCalls(r.toolCalls),
      toolResults: mapResults(r.toolResults),
      text: r.text,
      steps: r.steps?.map((step: any) => ({
        text: step.text,
        toolCalls: mapCalls(step.toolCalls),
        toolResults: mapResults(step.toolResults),
      })) || [],
    });

    try {
      const result = await aiGenerateText(buildOpts(maxSteps) as any);
      return toResult(result);
    } catch (err: any) {
      // DeepSeek reasoning/thinking models require reasoning_content to be passed back
      // between multi-step calls, which the AI SDK doesn't handle via the OpenAI-compat layer.
      // Retry with a single step so the model calls the tool directly.
      const msg: string = err?.message || String(err);
      if (msg.includes('reasoning_content') || msg.includes('thinking mode')) {
        console.warn('[CustomOpenAI] Reasoning model detected — retrying with maxSteps=1');
        const result = await aiGenerateText(buildOpts(1) as any);
        return toResult(result);
      }
      throw err;
    }
  }

  /** Returns the underlying chat model instance created by the OpenAI-compatible client. */
  getModel() {
    return this.model;
  }
}