Added TODO list; switched the git clones from GitHub to the local Gitea mirror for reliability
This commit is contained in:
parent
aeecb88f7d
commit
e0f2a8fb53
2
TODO.md
Normal file
2
TODO.md
Normal file
@ -0,0 +1,2 @@
|
||||
Check to see if the docker containers exist, remove them, then rebuild them.
|
||||
If the container is older than two weeks, rebuild.
|
||||
@ -5,7 +5,7 @@ docker run --name ik-llama-dw-$(date +%Y-%m-%d) --gpus=all $BASE_IMAGE /bin/bash
|
||||
'apt-get update
|
||||
apt-get --yes upgrade
|
||||
apt-get --yes install build-essential git libcurl4-openssl-dev curl libgomp1 cmake
|
||||
git clone https://github.com/ikawrakow/ik_llama.cpp
|
||||
git clone https://gitea.delony.net/jdelony/ik_llama.cpp
|
||||
cd ik_llama.cpp
|
||||
cmake -B build -DGGML_NATIVE=ON -DGGML_CUDA=ON
|
||||
cmake --build build --config Release -j$(nproc)'
|
||||
|
||||
@ -5,7 +5,7 @@ docker run --name llama-dw-$(date +%Y-%m-%d) --gpus=all $BASE_IMAGE /bin/bash -c
|
||||
'apt-get update
|
||||
apt-get --yes upgrade
|
||||
apt-get --yes install build-essential git libcurl4-openssl-dev curl libgomp1 cmake
|
||||
git clone https://github.com/ggml-org/llama.cpp
|
||||
git clone https://gitea.delony.net/jdelony/llama.cpp
|
||||
cd llama.cpp
|
||||
cmake -B build -DGGML_NATIVE=ON -DGGML_CUDA=ON
|
||||
cmake --build build --config Release -j$(nproc)'
|
||||
|
||||
59
sulphur-prompt-enhance.sh
Normal file
59
sulphur-prompt-enhance.sh
Normal file
@ -0,0 +1,59 @@
|
||||
#!/bin/bash
# Abort on the first unhandled command failure.
set -e

# Model alias passed to llama-server; also used to derive the container name.
MODEL_NAME="sulphur-prompt"
CONT_NAME="LLM-$MODEL_NAME"

# Host directory that is bind-mounted into the container as /model.
MODEL_FOLDER="/home/jared/.cache"

# Both GGUF files live in the same snapshot directory; paths are relative
# to MODEL_FOLDER (and therefore to /model inside the container).
MODEL_SNAPSHOT_DIR="huggingface/hub/models--SulphurAI--Sulphur-2-base/snapshots/b0ba1217a7c1eedca26afff4f5d53f77b951e4db/prompt_enhancer"
MODEL="$MODEL_SNAPSHOT_DIR/sulphur_prompt_enhancer_model-q8_0.gguf"
MODEL_MM="$MODEL_SNAPSHOT_DIR/mmproj-BF16.gguf"

# Port published on the host and listened on inside the container.
PORT=8555
|
||||
|
||||
# Load settings from ./env/llama_env.sh (path is relative to the current
# working directory). If the file is missing, run create_new_image.sh first.
# NOTE(review): create_new_image.sh is presumably what writes the env file —
# confirm; the check below fails loudly if it did not.
if [ ! -f "./env/llama_env.sh" ]; then
  echo "llama_env.sh not found, running create_new_image.sh..."
  if ! ./create_new_image.sh; then
    echo "✗ create_new_image.sh failed" >&2
    exit 1
  fi
fi

# Refuse to continue without the env file rather than failing later with a
# less obvious error.
if [ ! -f "./env/llama_env.sh" ]; then
  echo "✗ ./env/llama_env.sh is still missing" >&2
  exit 1
fi
source ./env/llama_env.sh
|
||||
|
||||
#######################################
# Remove the container named $CONT_NAME if it exists, so that the script
# can go on to create a fresh one.
# Globals:   CONT_NAME (read)
# Outputs:   progress messages on stdout; failure message on stderr
# Returns:   0 when the container is absent or was removed.
#            Exits the script with status 1 if removal fails.
#######################################
remove_existing_container() {
  if ! docker inspect "$CONT_NAME" > /dev/null 2>&1; then
    echo "ℹ Container '$CONT_NAME' does not exist. Creating new container."
    return 0
  fi

  echo "✓ Container '$CONT_NAME' found"

  # Purely informational: `docker rm -f` below removes it either way.
  if docker inspect -f '{{.State.Running}}' "$CONT_NAME" | grep -q "true"; then
    echo "⚠ Container is running, forcing removal..."
  fi

  if docker rm -f "$CONT_NAME"; then
    # Fall through (no exit) so the caller proceeds to create the container.
    echo "✓ Container removed successfully. Creating new container."
  else
    echo "✗ Failed to remove container" >&2
    exit 1
  fi
}

remove_existing_container
|
||||
|
||||
# Create the llama-server container and then start it attached.
# IMAGE is not assigned in this script; presumably it comes from the sourced
# ./env/llama_env.sh — verify. Fail early if it is empty, otherwise docker
# would treat the server binary path as the image name.
: "${IMAGE:?IMAGE is not set (expected from ./env/llama_env.sh)}"

# Options for `docker container create`. The health check polls the server's
# /v1/models endpoint using the container name as the host.
create_opts=(
  --name "$CONT_NAME"
  --network llms
  -p "${PORT}:${PORT}"
  -v "${MODEL_FOLDER}:/model"
  --user "$(id -u):$(id -g)"
  --gpus=all
  --restart on-failure:3
  --health-cmd "curl -f http://$CONT_NAME:$PORT/v1/models || exit 1"
  --health-interval 5s
  --health-timeout 5s
  --health-start-period 20s
)

# Command run inside the container; model paths are relative to the /model
# bind mount.
server_cmd=(
  /llama.cpp/build/bin/llama-server
  --model "/model/$MODEL"
  -mm "/model/$MODEL_MM"
  --alias "$MODEL_NAME"
  -ctk q8_0 -ctv q8_0
  --host "$CONT_NAME"
  --port "$PORT" --no-mmap -dio
  --reasoning off -c 16384 -np 2
)

docker container create "${create_opts[@]}" "$IMAGE" "${server_cmd[@]}"

echo "Done!"
# -a attaches to the container's output, so this call blocks while it runs.
docker container start -a "$CONT_NAME"
|
||||
Loading…
x
Reference in New Issue
Block a user