trustgraph/trustgraph_configurator/templates/1.6/components/tgi-service-intel-gpu.jsonnet
elpresidank 74cc8a4685 Squashed 'ai-context/trustgraph-templates/' content from commit 42a5fd1b
git-subtree-dir: ai-context/trustgraph-templates
git-subtree-split: 42a5fd1b678f32be378062e30451e2052ccb95dd
2026-04-05 21:09:49 -05:00

65 lines
1.9 KiB
Jsonnet

local base = import "base/base.jsonnet";
local images = import "values/images.jsonnet";
{
with:: function(key, value)
self + {
["tgi-service-" + key]:: value,
},
"tgi-service-model":: "teknium/OpenHermes-2.5-Mistral-7B",
"tgi-service-cpus":: "8.0",
"tgi-service-memory":: "16G",
"tgi-service" +: {
create:: function(engine)
local vol = engine.volume("tgi-storage").with_size("20G");
local container =
engine.container("tgi-service")
.with_image(images["tgi-service-intel-xpu"])
.with_command([
"--model-id",
$["tgi-service-model"],
"--cuda-graphs",
"0",
"--port",
"8899"
])
.with_environment({
HF_TOKEN: $["hf-token"],
})
.with_privileged(true)
.with_device("/dev/dri", "/dev/dri")
.with_ipc("host")
.with_capability("SYS_NICE")
.with_limits(
$["tgi-service-cpus"], $["tgi-service-memory"]
)
.with_reservations(
$["tgi-service-cpus"], $["tgi-service-memory"]
)
.with_port(8899, 8899, "tgi")
.with_volume_mount(vol, "/data");
local containerSet = engine.containers(
"tgi-service", [ container ]
);
local service =
engine.service(containerSet)
.with_port(8899, 8899, "tgi");
engine.resources([
vol,
containerSet,
service,
])
},
}