mirror of
https://github.com/trustgraph-ai/trustgraph.git
synced 2026-07-01 17:39:39 +02:00
Use Effect primitives for AI and response fanout
This commit is contained in:
parent
8f47456a4b
commit
24a2447cc3
5 changed files with 392 additions and 59 deletions
|
|
@ -4,12 +4,14 @@ import {
|
|||
errorMessage,
|
||||
makeLlmServiceShape,
|
||||
type LlmChunk,
|
||||
type LlmResult,
|
||||
type LlmProvider,
|
||||
} from "@trustgraph/base";
|
||||
import { Config, Effect, Layer, Ref, Result, Stream } from "effect";
|
||||
import { Config, Effect, Layer, ManagedRuntime, Ref, Result, Stream } from "effect";
|
||||
import * as O from "effect/Option";
|
||||
import * as Predicate from "effect/Predicate";
|
||||
import * as S from "effect/Schema";
|
||||
import { AiError, LanguageModel, Prompt, Response } from "effect/unstable/ai";
|
||||
|
||||
export class TextCompletionConfigError extends S.TaggedErrorClass<TextCompletionConfigError>()(
|
||||
"TextCompletionConfigError",
|
||||
|
|
@ -32,6 +34,21 @@ export type TextCompletionRuntimeError =
|
|||
| TextCompletionProviderError
|
||||
| TooManyRequestsError;
|
||||
|
||||
export interface LanguageModelProviderRequest {
|
||||
readonly model: string;
|
||||
readonly temperature: number;
|
||||
}
|
||||
|
||||
export interface LanguageModelProviderOptions<Requirements> {
|
||||
readonly provider: string;
|
||||
readonly defaultModel: string;
|
||||
readonly defaultTemperature: number;
|
||||
readonly runtime: ManagedRuntime.ManagedRuntime<Requirements, TextCompletionRuntimeError>;
|
||||
readonly makeLanguageModel: (
|
||||
request: LanguageModelProviderRequest,
|
||||
) => Effect.Effect<LanguageModel.Service, TextCompletionRuntimeError, Requirements>;
|
||||
}
|
||||
|
||||
export const makeTextCompletionLayer = <E, R>(
|
||||
provider: Effect.Effect<LlmProvider, E, R>,
|
||||
): Layer.Layer<Llm, E, R> =>
|
||||
|
|
@ -83,6 +100,33 @@ const textChunk = (model: string, text: string): LlmChunk => ({
|
|||
isFinal: false,
|
||||
});
|
||||
|
||||
const effectAiProviderError = (
|
||||
provider: string,
|
||||
error: unknown,
|
||||
): TextCompletionRuntimeError => {
|
||||
if (
|
||||
AiError.isAiError(error) &&
|
||||
(error.reason._tag === "RateLimitError" || error.reason._tag === "QuotaExhaustedError")
|
||||
) {
|
||||
return TooManyRequestsError.make({ message: "Rate limit exceeded" });
|
||||
}
|
||||
return providerRuntimeError(provider, error);
|
||||
};
|
||||
|
||||
const usageInputTokens = (usage: Response.Usage): number =>
|
||||
usage.inputTokens.total ?? 0;
|
||||
|
||||
const usageOutputTokens = (usage: Response.Usage): number =>
|
||||
usage.outputTokens.total ?? 0;
|
||||
|
||||
const languageModelPrompt = (
|
||||
system: string,
|
||||
prompt: string,
|
||||
): Prompt.RawInput => [
|
||||
{ role: "system", content: system },
|
||||
{ role: "user", content: [{ type: "text", text: prompt }] },
|
||||
];
|
||||
|
||||
const contentPartText = (part: unknown): O.Option<string> =>
|
||||
Predicate.isObject(part) &&
|
||||
Predicate.hasProperty(part, "text") &&
|
||||
|
|
@ -200,6 +244,105 @@ export const providerStatusError = (
|
|||
: providerRuntimeError(provider, error);
|
||||
};
|
||||
|
||||
const languageModelResult = (
|
||||
response: LanguageModel.GenerateTextResponse<{}>,
|
||||
model: string,
|
||||
): LlmResult => ({
|
||||
text: response.text,
|
||||
inToken: usageInputTokens(response.usage),
|
||||
outToken: usageOutputTokens(response.usage),
|
||||
model,
|
||||
});
|
||||
|
||||
const languageModelStreamChunk = (
|
||||
provider: string,
|
||||
model: string,
|
||||
part: Response.StreamPart<{}>,
|
||||
): Effect.Effect<Result.Result<LlmChunk, undefined>, TextCompletionRuntimeError> => {
|
||||
switch (part.type) {
|
||||
case "text-delta":
|
||||
return Effect.succeed(
|
||||
part.delta.length > 0
|
||||
? Result.succeed(textChunk(model, part.delta))
|
||||
: Result.fail(undefined),
|
||||
);
|
||||
case "finish":
|
||||
return Effect.succeed(
|
||||
Result.succeed(
|
||||
finalChunk(model, {
|
||||
inToken: usageInputTokens(part.usage),
|
||||
outToken: usageOutputTokens(part.usage),
|
||||
}),
|
||||
),
|
||||
);
|
||||
case "error":
|
||||
return Effect.fail(effectAiProviderError(provider, part.error));
|
||||
default:
|
||||
return Effect.succeed(Result.fail(undefined));
|
||||
}
|
||||
};
|
||||
|
||||
const runLanguageModelStream = <RuntimeRequirements, StreamRequirements extends RuntimeRequirements>(
|
||||
runtime: ManagedRuntime.ManagedRuntime<RuntimeRequirements, TextCompletionRuntimeError>,
|
||||
stream: Stream.Stream<LlmChunk, TextCompletionRuntimeError, StreamRequirements>,
|
||||
): AsyncIterable<LlmChunk> => ({
|
||||
[Symbol.asyncIterator]: () => {
|
||||
const iterator = runtime.context().then((context) =>
|
||||
Stream.toAsyncIterableWith(stream, context)[Symbol.asyncIterator]()
|
||||
);
|
||||
return {
|
||||
next: () => iterator.then((current) => current.next()),
|
||||
};
|
||||
},
|
||||
});
|
||||
|
||||
export const makeLanguageModelProvider = <Requirements>(
|
||||
options: LanguageModelProviderOptions<Requirements>,
|
||||
): LlmProvider => ({
|
||||
generateContent: (system, prompt, model, temperature) => {
|
||||
const modelName = model ?? options.defaultModel;
|
||||
const temp = temperature ?? options.defaultTemperature;
|
||||
return options.runtime.runPromise(
|
||||
Effect.gen(function* () {
|
||||
const languageModel = yield* options.makeLanguageModel({
|
||||
model: modelName,
|
||||
temperature: temp,
|
||||
});
|
||||
const response = yield* languageModel.generateText({
|
||||
prompt: languageModelPrompt(system, prompt),
|
||||
}).pipe(
|
||||
Effect.mapError((error) => effectAiProviderError(options.provider, error)),
|
||||
);
|
||||
return languageModelResult(response, modelName);
|
||||
}),
|
||||
);
|
||||
},
|
||||
supportsStreaming: () => true,
|
||||
generateContentStream: (system, prompt, model, temperature) => {
|
||||
const modelName = model ?? options.defaultModel;
|
||||
const temp = temperature ?? options.defaultTemperature;
|
||||
const stream = Stream.unwrap(
|
||||
Effect.gen(function* () {
|
||||
const languageModel = yield* options.makeLanguageModel({
|
||||
model: modelName,
|
||||
temperature: temp,
|
||||
});
|
||||
return languageModel.streamText({
|
||||
prompt: languageModelPrompt(system, prompt),
|
||||
}).pipe(
|
||||
Stream.mapError((error) => effectAiProviderError(options.provider, error)),
|
||||
Stream.filterMapEffect((part) =>
|
||||
languageModelStreamChunk(options.provider, modelName, part)
|
||||
),
|
||||
);
|
||||
}),
|
||||
);
|
||||
return toAsyncGenerator(runLanguageModelStream(options.runtime, stream), (error) =>
|
||||
effectAiProviderError(options.provider, error)
|
||||
);
|
||||
},
|
||||
});
|
||||
|
||||
export const toAsyncGenerator = (
|
||||
iterable: AsyncIterable<LlmChunk>,
|
||||
mapError: (error: unknown) => TextCompletionRuntimeError,
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue