|
@@ -13,6 +13,8 @@ elif [[ "$arg1" == '--quantize' || "$arg1" == '-q' ]]; then
|
|
|
exec ./llama-quantize "$@"
|
|
exec ./llama-quantize "$@"
|
|
|
elif [[ "$arg1" == '--run' || "$arg1" == '-r' ]]; then
|
|
elif [[ "$arg1" == '--run' || "$arg1" == '-r' ]]; then
|
|
|
exec ./llama-cli "$@"
|
|
exec ./llama-cli "$@"
|
|
|
|
|
+elif [[ "$arg1" == '--run-legacy' || "$arg1" == '-l' ]]; then
|
|
|
|
|
+ exec ./llama-completion "$@"
|
|
|
elif [[ "$arg1" == '--bench' || "$arg1" == '-b' ]]; then
|
|
elif [[ "$arg1" == '--bench' || "$arg1" == '-b' ]]; then
|
|
|
exec ./llama-bench "$@"
|
|
exec ./llama-bench "$@"
|
|
|
elif [[ "$arg1" == '--perplexity' || "$arg1" == '-p' ]]; then
|
|
elif [[ "$arg1" == '--perplexity' || "$arg1" == '-p' ]]; then
|
|
@@ -32,8 +34,10 @@ elif [[ "$arg1" == '--server' || "$arg1" == '-s' ]]; then
|
|
|
else
|
|
else
|
|
|
echo "Unknown command: $arg1"
|
|
echo "Unknown command: $arg1"
|
|
|
echo "Available commands: "
|
|
echo "Available commands: "
|
|
|
- echo " --run (-r): Run a model previously converted into ggml"
|
|
|
|
|
- echo " ex: -m /models/7B/ggml-model-q4_0.bin -p \"Building a website can be done in 10 simple steps:\" -n 512"
|
|
|
|
|
|
|
+ echo " --run (-r): Run a model (chat) previously converted into ggml"
|
|
|
|
|
+ echo " ex: -m /models/7B/ggml-model-q4_0.bin"
|
|
|
|
|
+ echo " --run-legacy (-l): Run a model (legacy completion) previously converted into ggml"
|
|
|
|
|
+ echo " ex: -m /models/7B/ggml-model-q4_0.bin -no-cnv -p \"Building a website can be done in 10 simple steps:\" -n 512"
|
|
|
echo " --bench (-b): Benchmark the performance of the inference for various parameters."
|
|
echo " --bench (-b): Benchmark the performance of the inference for various parameters."
|
|
|
echo " ex: -m model.gguf"
|
|
echo " ex: -m model.gguf"
|
|
|
echo " --perplexity (-p): Measure the perplexity of a model over a given text."
|
|
echo " --perplexity (-p): Measure the perplexity of a model over a given text."
|