2024-07-10 23:20:06 +01:00
|
|
|
|
|
|
|
|
import _pulsar
|
|
|
|
|
|
2024-08-20 17:54:11 +01:00
|
|
|
from .. schema import TextCompletionRequest, TextCompletionResponse
|
|
|
|
|
from .. schema import text_completion_request_queue
|
|
|
|
|
from .. schema import text_completion_response_queue
|
2024-08-22 17:02:18 +01:00
|
|
|
from . base import BaseClient
|
2024-07-23 21:34:03 +01:00
|
|
|
|
2024-07-10 23:20:06 +01:00
|
|
|
# Ugly
|
|
|
|
|
ERROR=_pulsar.LoggerLevel.Error
|
|
|
|
|
WARN=_pulsar.LoggerLevel.Warn
|
|
|
|
|
INFO=_pulsar.LoggerLevel.Info
|
|
|
|
|
DEBUG=_pulsar.LoggerLevel.Debug
|
|
|
|
|
|
2024-08-22 17:02:18 +01:00
|
|
|
class LlmClient(BaseClient):
|
2024-07-10 23:20:06 +01:00
|
|
|
|
|
|
|
|
def __init__(
|
2024-08-05 22:05:28 +01:00
|
|
|
self, log_level=ERROR,
|
|
|
|
|
subscriber=None,
|
|
|
|
|
input_queue=None,
|
|
|
|
|
output_queue=None,
|
2024-07-10 23:20:06 +01:00
|
|
|
pulsar_host="pulsar://pulsar:6650",
|
|
|
|
|
):
|
|
|
|
|
|
2024-08-22 17:02:18 +01:00
|
|
|
if input_queue is None: input_queue = text_completion_request_queue
|
|
|
|
|
if output_queue is None: output_queue = text_completion_response_queue
|
|
|
|
|
|
|
|
|
|
super(LlmClient, self).__init__(
|
|
|
|
|
log_level=log_level,
|
|
|
|
|
subscriber=subscriber,
|
|
|
|
|
input_queue=input_queue,
|
|
|
|
|
output_queue=output_queue,
|
|
|
|
|
pulsar_host=pulsar_host,
|
|
|
|
|
input_schema=TextCompletionRequest,
|
|
|
|
|
output_schema=TextCompletionResponse,
|
2024-07-10 23:20:06 +01:00
|
|
|
)
|
|
|
|
|
|
2024-11-05 22:46:17 +00:00
|
|
|
def request(self, system, prompt, timeout=300):
|
|
|
|
|
return self.call(
|
|
|
|
|
system=system, prompt=prompt, timeout=timeout
|
|
|
|
|
).response
|
2024-07-10 23:20:06 +01:00
|
|
|
|