mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-30 08:42:00 +00:00 
			
		
		
		
	fix: graceful shutdown for Docker images (#10815)
This commit is contained in:
		| @@ -8,11 +8,11 @@ arg1="$1" | ||||
| shift | ||||
|  | ||||
| if [[ "$arg1" == '--convert' || "$arg1" == '-c' ]]; then | ||||
|     python3 ./convert_hf_to_gguf.py "$@" | ||||
|     exec python3 ./convert_hf_to_gguf.py "$@" | ||||
| elif [[ "$arg1" == '--quantize' || "$arg1" == '-q' ]]; then | ||||
|     ./llama-quantize "$@" | ||||
|     exec ./llama-quantize "$@" | ||||
| elif [[ "$arg1" == '--run' || "$arg1" == '-r' ]]; then | ||||
|     ./llama-cli "$@" | ||||
|     exec ./llama-cli "$@" | ||||
| elif [[ "$arg1" == '--all-in-one' || "$arg1" == '-a' ]]; then | ||||
|     echo "Converting PTH to GGML..." | ||||
|     for i in `ls $1/$2/ggml-model-f16.bin*`; do | ||||
| @@ -20,11 +20,11 @@ elif [[ "$arg1" == '--all-in-one' || "$arg1" == '-a' ]]; then | ||||
|             echo "Skip model quantization, it already exists: ${i/f16/q4_0}" | ||||
|         else | ||||
|             echo "Converting PTH to GGML: $i into ${i/f16/q4_0}..." | ||||
|             ./llama-quantize "$i" "${i/f16/q4_0}" q4_0 | ||||
|             exec ./llama-quantize "$i" "${i/f16/q4_0}" q4_0 | ||||
|         fi | ||||
|     done | ||||
| elif [[ "$arg1" == '--server' || "$arg1" == '-s' ]]; then | ||||
|     ./llama-server "$@" | ||||
|     exec ./llama-server "$@" | ||||
| else | ||||
|     echo "Unknown command: $arg1" | ||||
|     echo "Available commands: " | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Corentin REGAL
					Corentin REGAL