update instruct and think containers

This commit is contained in:
2026-04-16 16:05:52 -04:00
parent 66f9304cc6
commit e43c534ceb
2 changed files with 9 additions and 4 deletions

View File

@@ -17,12 +17,17 @@ AddDevice=/dev/dri
# Server command
Exec=--port 8000 \
-c 64000 \
-c 128000 \
--top-k 64 \
--top-p 0.95 \
--temp 1.0 \
--perf \
-v \
--n-gpu-layers all \
--jinja \
--models-max 1 \
--models-dir /models
-m /models/gemma-4-26b-a4b/gemma-4-26B-A4B-it-UD-Q8_K_XL.gguf \
--mmproj /models/gemma-4-26b-a4b/mmproj-BF16.gguf \
--alias think
# Health Check
HealthCmd=CMD-SHELL curl --fail http://127.0.0.1:8000/health || exit 1