Просмотр исходного кода

fix: graceful shutdown for Docker images (#10815)

Corentin REGAL 1 год назад
Родитель
Коммит
11e07fd63b
1 изменённый файл: 5 добавлений и 5 удалений
  1. 5 5
      .devops/tools.sh

+ 5 - 5
.devops/tools.sh

@@ -8,11 +8,11 @@ arg1="$1"
 shift
 shift
 
 
 if [[ "$arg1" == '--convert' || "$arg1" == '-c' ]]; then
 if [[ "$arg1" == '--convert' || "$arg1" == '-c' ]]; then
-    python3 ./convert_hf_to_gguf.py "$@"
+    exec python3 ./convert_hf_to_gguf.py "$@"
 elif [[ "$arg1" == '--quantize' || "$arg1" == '-q' ]]; then
 elif [[ "$arg1" == '--quantize' || "$arg1" == '-q' ]]; then
-    ./llama-quantize "$@"
+    exec ./llama-quantize "$@"
 elif [[ "$arg1" == '--run' || "$arg1" == '-r' ]]; then
 elif [[ "$arg1" == '--run' || "$arg1" == '-r' ]]; then
-    ./llama-cli "$@"
+    exec ./llama-cli "$@"
 elif [[ "$arg1" == '--all-in-one' || "$arg1" == '-a' ]]; then
 elif [[ "$arg1" == '--all-in-one' || "$arg1" == '-a' ]]; then
     echo "Converting PTH to GGML..."
     echo "Converting PTH to GGML..."
     for i in `ls $1/$2/ggml-model-f16.bin*`; do
     for i in `ls $1/$2/ggml-model-f16.bin*`; do
@@ -20,11 +20,11 @@ elif [[ "$arg1" == '--all-in-one' || "$arg1" == '-a' ]]; then
             echo "Skip model quantization, it already exists: ${i/f16/q4_0}"
             echo "Skip model quantization, it already exists: ${i/f16/q4_0}"
         else
         else
             echo "Converting PTH to GGML: $i into ${i/f16/q4_0}..."
             echo "Converting PTH to GGML: $i into ${i/f16/q4_0}..."
-            ./llama-quantize "$i" "${i/f16/q4_0}" q4_0
+            exec ./llama-quantize "$i" "${i/f16/q4_0}" q4_0
         fi
         fi
     done
     done
 elif [[ "$arg1" == '--server' || "$arg1" == '-s' ]]; then
 elif [[ "$arg1" == '--server' || "$arg1" == '-s' ]]; then
-    ./llama-server "$@"
+    exec ./llama-server "$@"
 else
 else
     echo "Unknown command: $arg1"
     echo "Unknown command: $arg1"
     echo "Available commands: "
     echo "Available commands: "