fix: graceful shutdown for Docker images (#10815)

author Corentin REGAL <redacted>

Fri, 13 Dec 2024 17:23:50 +0000 (18:23 +0100)

committer GitHub <redacted>

Fri, 13 Dec 2024 17:23:50 +0000 (18:23 +0100)
author Corentin REGAL <redacted>
Fri, 13 Dec 2024 17:23:50 +0000 (18:23 +0100)
committer GitHub <redacted>
Fri, 13 Dec 2024 17:23:50 +0000 (18:23 +0100)
diff --git a/.devops/tools.sh b/.devops/tools.sh

index 24dcfd35079cb73236dc80d911480bcbacc7008d..9a86e6ea0185df68d5174cdd517a872e3bce83c8 100755 (executable)
--- a/.devops/tools.sh
+++ b/.devops/tools.sh
@@ -8,11 +8,11 @@ arg1="$1"
  shift
  
  if [[ "$arg1" == '--convert' || "$arg1" == '-c' ]]; then
-    python3 ./convert_hf_to_gguf.py "$@"
+    exec python3 ./convert_hf_to_gguf.py "$@"
  elif [[ "$arg1" == '--quantize' || "$arg1" == '-q' ]]; then
-    ./llama-quantize "$@"
+    exec ./llama-quantize "$@"
  elif [[ "$arg1" == '--run' || "$arg1" == '-r' ]]; then
-    ./llama-cli "$@"
+    exec ./llama-cli "$@"
  elif [[ "$arg1" == '--all-in-one' || "$arg1" == '-a' ]]; then
      echo "Converting PTH to GGML..."
      for i in `ls $1/$2/ggml-model-f16.bin*`; do
@@ -20,11 +20,12 @@ elif [[ "$arg1" == '--all-in-one' || "$arg1" == '-a' ]]; then
              echo "Skip model quantization, it already exists: ${i/f16/q4_0}"
          else
              echo "Converting PTH to GGML: $i into ${i/f16/q4_0}..."
+            # Deliberately not exec'd: exec would replace this shell and end the loop after the first file.
              ./llama-quantize "$i" "${i/f16/q4_0}" q4_0
          fi
      done
  elif [[ "$arg1" == '--server' || "$arg1" == '-s' ]]; then
-    ./llama-server "$@"
+    exec ./llama-server "$@"
  else
      echo "Unknown command: $arg1"
      echo "Available commands: "
author	Corentin REGAL <redacted>
	Fri, 13 Dec 2024 17:23:50 +0000 (18:23 +0100)
committer	GitHub <redacted>
	Fri, 13 Dec 2024 17:23:50 +0000 (18:23 +0100)