/** * OpenAI text completion service. * * Python reference: trustgraph-flow/trustgraph/model/text_completion/openai/llm.py */ import OpenAI from "openai"; import { Llm, makeLlmService, makeFlowProcessorProgram, makeLlmServiceShape, makeLlmSpecs, type LlmProvider, type ProcessorConfig, type LlmResult, type LlmChunk, tooManyRequestsError, } from "@trustgraph/base"; import { Effect, Layer } from "effect"; export type OpenAIProcessorConfig = ProcessorConfig & { model?: string; apiKey?: string; baseUrl?: string; temperature?: number; maxOutput?: number; }; export function makeOpenAIProvider(config: OpenAIProcessorConfig): LlmProvider { const defaultModel = config.model ?? "gpt-4o"; const defaultTemperature = config.temperature ?? 0.0; const maxOutput = config.maxOutput ?? 4096; const apiKey = config.apiKey ?? process.env.OPENAI_TOKEN; if (apiKey === undefined || apiKey.length === 0) { throw new Error("OpenAI API key not specified"); } const client = new OpenAI({ apiKey, baseURL: config.baseUrl ?? process.env.OPENAI_BASE_URL, }); console.log("[OpenAI] LLM service initialized"); return { generateContent: async ( system: string, prompt: string, model?: string, temperature?: number, ): Promise => { const modelName = model ?? defaultModel; const temp = temperature ?? defaultTemperature; try { const resp = await client.chat.completions.create({ model: modelName, messages: [ { role: "system", content: system }, { role: "user", content: prompt }, ], temperature: temp, max_completion_tokens: maxOutput, }); return { text: resp.choices[0].message.content ?? "", inToken: resp.usage?.prompt_tokens ?? 0, outToken: resp.usage?.completion_tokens ?? 0, model: modelName, }; } catch (err) { if (err instanceof OpenAI.RateLimitError) { throw tooManyRequestsError(); } throw err; } }, supportsStreaming: () => true, generateContentStream: async function* ( system: string, prompt: string, model?: string, temperature?: number, ): AsyncGenerator { const modelName = model ?? defaultModel; const temp = temperature ?? defaultTemperature; try { const stream = await client.chat.completions.create({ model: modelName, messages: [ { role: "system", content: system }, { role: "user", content: prompt }, ], temperature: temp, max_completion_tokens: maxOutput, stream: true, stream_options: { include_usage: true }, }); let totalInputTokens = 0; let totalOutputTokens = 0; for await (const chunk of stream) { const content = chunk.choices[0]?.delta?.content; if (content !== null && content !== undefined && content.length > 0) { yield { text: content, inToken: null, outToken: null, model: modelName, isFinal: false, }; } if (chunk.usage !== null && chunk.usage !== undefined) { totalInputTokens = chunk.usage.prompt_tokens; totalOutputTokens = chunk.usage.completion_tokens; } } yield { text: "", inToken: totalInputTokens, outToken: totalOutputTokens, model: modelName, isFinal: true, }; } catch (err) { if (err instanceof OpenAI.RateLimitError) { throw tooManyRequestsError(); } throw err; } }, }; } export type OpenAIProcessor = ReturnType; export function makeOpenAIProcessor(config: OpenAIProcessorConfig): ReturnType { return makeLlmService(config, makeOpenAIProvider(config)); } export const OpenAIProcessor = makeOpenAIProcessor; export const program = makeFlowProcessorProgram({ id: "text-completion", specs: () => makeLlmSpecs(), layer: (config) => Layer.succeed( Llm, Llm.of(makeLlmServiceShape(makeOpenAIProvider(config))), ), }); export async function run(): Promise { await Effect.runPromise(program); }