update instruct and think containers
This commit is contained in:
@@ -17,7 +17,7 @@ AddDevice=/dev/dri
|
|||||||
|
|
||||||
# Server command
|
# Server command
|
||||||
Exec=--port 8002 \
|
Exec=--port 8002 \
|
||||||
-c 16000 \
|
-c 64000 \
|
||||||
--perf \
|
--perf \
|
||||||
-v \
|
-v \
|
||||||
--top-k 20 \
|
--top-k 20 \
|
||||||
|
|||||||
@@ -17,12 +17,17 @@ AddDevice=/dev/dri
|
|||||||
|
|
||||||
# Server command
|
# Server command
|
||||||
Exec=--port 8000 \
|
Exec=--port 8000 \
|
||||||
-c 64000 \
|
-c 128000 \
|
||||||
|
--top-k 64 \
|
||||||
|
--top-p 0.95 \
|
||||||
|
--temp 1.0 \
|
||||||
--perf \
|
--perf \
|
||||||
|
-v \
|
||||||
--n-gpu-layers all \
|
--n-gpu-layers all \
|
||||||
--jinja \
|
--jinja \
|
||||||
--models-max 1 \
|
-m /models/gemma-4-26b-a4b/gemma-4-26B-A4B-it-UD-Q8_K_XL.gguf \
|
||||||
--models-dir /models
|
--mmproj /models/gemma-4-26b-a4b/mmproj-BF16.gguf \
|
||||||
|
--alias think
|
||||||
|
|
||||||
# Health Check
|
# Health Check
|
||||||
HealthCmd=CMD-SHELL curl --fail http://127.0.0.1:8000/health || exit 1
|
HealthCmd=CMD-SHELL curl --fail http://127.0.0.1:8000/health || exit 1
|
||||||
|
|||||||
Reference in New Issue
Block a user