Fixed qwen3-coder

This commit is contained in:
Jared Delony 2026-03-18 17:31:21 -05:00
parent 38d8f2eccc
commit e513c097ce
Signed by: jdelony
SSH Key Fingerprint: SHA256:W5F7KMb6FLjlHNhQhtrDl4NvR5fCfinaDDXSQnA2sF0

View File

@@ -6,10 +6,17 @@ MODEL_FOLDER="/sam4t/ENC/LLM/Qwen3-Coder-Next"
source ./env.sh
echo $IK_IMAGE
docker run --name ik_$MODEL_NAME --network host -v $MODEL_FOLDER:/model --gpus=all $IK_IMAGE /ik_llama.cpp/build/bin/llama-server \
docker run --name ik_$MODEL_NAME -d --network llms -p 8654:8654 -v $MODEL_FOLDER:/model --gpus=all \
--health-cmd "curl -f http://ik_$MODEL_NAME:8654/v1/models || exit 1" \
--health-interval 15s \
--health-timeout 5s \
--health-start-period 15s \
$IK_IMAGE \
/ik_llama.cpp/build/bin/llama-server \
--model /model/$MODEL \
-ctk q8_0 -ctv q8_0 \
--parallel 1 --threads 32 \
--host ik_$MODEL_NAME \
--port 8654 -ngl 99 \
--alias $MODEL_NAME \
--no-mmap --jinja \