From d2cf1ab5e2cb8e610c18aff1691bb72cc1eada08 Mon Sep 17 00:00:00 2001 From: Jared Delony Date: Sat, 16 May 2026 16:55:56 -0500 Subject: [PATCH] Fixed the mmproj file flag --- Qwen3.6-35B-A3B-Uncensored-Aggres-noThink.sh | 2 +- Qwen3.6-35B-A3B-Uncensored-Aggres.sh | 3 +-- gemma-4-26B-A4B-mxfp4-noThink.sh | 2 +- gemma-4-26B-A4B-mxfp4.sh | 4 ++-- 4 files changed, 5 insertions(+), 6 deletions(-) diff --git a/Qwen3.6-35B-A3B-Uncensored-Aggres-noThink.sh b/Qwen3.6-35B-A3B-Uncensored-Aggres-noThink.sh index 9e98198..671a302 100755 --- a/Qwen3.6-35B-A3B-Uncensored-Aggres-noThink.sh +++ b/Qwen3.6-35B-A3B-Uncensored-Aggres-noThink.sh @@ -24,7 +24,7 @@ docker container create --name $CONT_NAME --network llms -p $PORT:$PORT -v $MODE $IMAGE \ /llama.cpp/build/bin/llama-server \ --model /model/$MODEL \ - --mm /model/$MODEL_MM \ + -mm /model/$MODEL_MM \ --alias $MODEL_NAME \ -ctk q8_0 -ctv q8_0 \ --reasoning-budget 0 \ diff --git a/Qwen3.6-35B-A3B-Uncensored-Aggres.sh b/Qwen3.6-35B-A3B-Uncensored-Aggres.sh index aa31e62..889488f 100755 --- a/Qwen3.6-35B-A3B-Uncensored-Aggres.sh +++ b/Qwen3.6-35B-A3B-Uncensored-Aggres.sh @@ -7,7 +7,6 @@ MODEL_FOLDER="/home/jared/.cache" MODEL="huggingface/hub/models--HauhauCS--Qwen3.6-35B-A3B-Uncensored-HauhauCS-Aggressive/snapshots/f12a584fecbeb5f20001130d8ecd66c9327ae685/Qwen3.6-35B-A3B-Uncensored-HauhauCS-Aggressive-IQ4_XS.gguf" MODEL_MM="huggingface/hub/models--HauhauCS--Qwen3.6-35B-A3B-Uncensored-HauhauCS-Aggressive/snapshots/f12a584fecbeb5f20001130d8ecd66c9327ae685/mmproj-Qwen3.6-35B-A3B-Uncensored-HauhauCS-Aggressive-f16.gguf" - PORT=8356 # Check if llama_env.sh exists, if not run create_new_image.sh @@ -25,7 +24,7 @@ docker container create --name $CONT_NAME --network llms -p $PORT:$PORT -v $MODE $IMAGE \ /llama.cpp/build/bin/llama-server \ --model /model/$MODEL \ - --mm /model/$MODEL_MM \ + -mm /model/$MODEL_MM \ --alias $MODEL_NAME \ -ctk q8_0 -ctv q8_0 \ --host $CONT_NAME \ diff --git a/gemma-4-26B-A4B-mxfp4-noThink.sh b/gemma-4-26B-A4B-mxfp4-noThink.sh index 036b595..8220fce 100755 --- a/gemma-4-26B-A4B-mxfp4-noThink.sh +++ b/gemma-4-26B-A4B-mxfp4-noThink.sh @@ -25,7 +25,7 @@ docker container create --name $CONT_NAME --network llms -p $PORT:$PORT -v $MODE $IMAGE \ /llama.cpp/build/bin/llama-server \ --model /model/$MODEL \ - --mm /model/$MODEL_MM \ + -mm /model/$MODEL_MM \ --alias $MODEL_NAME \ -ctk q8_0 -ctv q8_0 \ --reasoning-budget 0 \ diff --git a/gemma-4-26B-A4B-mxfp4.sh b/gemma-4-26B-A4B-mxfp4.sh index 954a229..471b4a5 100755 --- a/gemma-4-26B-A4B-mxfp4.sh +++ b/gemma-4-26B-A4B-mxfp4.sh @@ -14,8 +14,8 @@ if [ ! -f "./env/llama_env.sh" ]; then echo "llama_env.sh not found, running create_new_image.sh..." ./create_new_image.sh fi - source ./env/llama_env.sh + echo $IMAGE docker container create --name $CONT_NAME --network llms -p $PORT:$PORT -v $MODEL_FOLDER:/model --user $(id -u):$(id -g) --gpus=all --restart on-failure:3 \ --health-cmd "curl -f http://$CONT_NAME:$PORT/v1/models || exit 1" \ @@ -25,7 +25,7 @@ docker container create --name $CONT_NAME --network llms -p $PORT:$PORT -v $MODE $IMAGE \ /llama.cpp/build/bin/llama-server \ --model /model/$MODEL \ - --mm /model/$MODEL_MM \ + -mm /model/$MODEL_MM \ --alias $MODEL_NAME \ -ctk q8_0 -ctv q8_0 \ --host $CONT_NAME \