update instruct and think containers
This commit is contained in:
@@ -17,12 +17,17 @@ AddDevice=/dev/dri
|
||||
|
||||
# Server command
|
||||
Exec=--port 8000 \
|
||||
-c 64000 \
|
||||
-c 128000 \
|
||||
--top-k 64 \
|
||||
--top-p 0.95 \
|
||||
--temp 1.0 \
|
||||
--perf \
|
||||
-v \
|
||||
--n-gpu-layers all \
|
||||
--jinja \
|
||||
--models-max 1 \
|
||||
--models-dir /models
|
||||
-m /models/gemma-4-26b-a4b/gemma-4-26B-A4B-it-UD-Q8_K_XL.gguf \
|
||||
--mmproj /models/gemma-4-26b-a4b/mmproj-BF16.gguf \
|
||||
--alias think
|
||||
|
||||
# Health Check
|
||||
HealthCmd=CMD-SHELL curl --fail http://127.0.0.1:8000/health || exit 1
|
||||
|
||||
Reference in New Issue
Block a user