Fixed qwen3-coder
This commit is contained in:
parent
38d8f2eccc
commit
e513c097ce
@ -6,10 +6,17 @@ MODEL_FOLDER="/sam4t/ENC/LLM/Qwen3-Coder-Next"
|
||||
|
||||
source ./env.sh
|
||||
echo $IK_IMAGE
|
||||
docker run --name ik_$MODEL_NAME --network host -v $MODEL_FOLDER:/model --gpus=all $IK_IMAGE /ik_llama.cpp/build/bin/llama-server \
|
||||
docker run --name ik_$MODEL_NAME -d --network llms -p 8654:8654 -v $MODEL_FOLDER:/model --gpus=all \
|
||||
--health-cmd "curl -f http://ik_$MODEL_NAME:8654/v1/models || exit 1" \
|
||||
--health-interval 15s \
|
||||
--health-timeout 5s \
|
||||
--health-start-period 15s \
|
||||
$IK_IMAGE \
|
||||
/ik_llama.cpp/build/bin/llama-server \
|
||||
--model /model/$MODEL \
|
||||
-ctk q8_0 -ctv q8_0 \
|
||||
--parallel 1 --threads 32 \
|
||||
--host ik_$MODEL_NAME \
|
||||
--port 8654 -ngl 99 \
|
||||
--alias $MODEL_NAME \
|
||||
--no-mmap --jinja \
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user