#!/bin/sh
#
# run-cli.sh - run llama-cli on an Android device through "adb shell".
#
# Usage: [VAR=value ...] run-cli.sh [llama-cli arguments ...]
#
# Every argument given to this script is appended to the llama-cli command
# line on the device. Each one is single-quoted first, so values containing
# spaces or shell metacharacters (for example: -p "hello world") reach
# llama-cli as one unchanged word.
#
# Optional environment variables (an empty value is treated as unset):
#   B       directory under $basedir that holds bin/ and lib/ (default: .)
#   S       device serial, passed to adb as "-s $S"
#   M       model file name, looked up in $basedir/../gguf
#   D       value passed to llama-cli --device (default: HTP0)
#   V       sets GGML_HEXAGON_VERBOSE=$V for llama-cli
#   E       sets GGML_HEXAGON_EXPERIMENTAL=$E for llama-cli
#   SCHED   when non-empty, sets GGML_SCHED_DEBUG=2 and adds -v to llama-cli
#   PROF    sets GGML_HEXAGON_PROFILE=$PROF and GGML_HEXAGON_OPSYNC=1
#   OPMASK  sets GGML_HEXAGON_OPMASK=$OPMASK for llama-cli
#   NHVX    sets GGML_HEXAGON_NHVX=$NHVX for llama-cli
#   NDEV    sets GGML_HEXAGON_NDEV=$NDEV for llama-cli

# quote_arg STRING
# Print STRING wrapped in single quotes, with every embedded single quote
# rewritten as '\'' so that a POSIX shell parses the result back into
# exactly STRING.
quote_arg() {
    printf '%s\n' "$1" | sed "s/'/'\\\\''/g; 1s/^/'/; \$s/\$/'/"
}

# quote_args [STRING ...]
# Print each argument quoted by quote_arg, each preceded by one space.
# Prints nothing when called without arguments.
quote_args() {
    _quoted=
    for _arg in "$@"; do
        _quoted="$_quoted $(quote_arg "$_arg")"
    done
    printf '%s' "$_quoted"
}

# Basedir on device
basedir=/data/local/tmp/llama.cpp

cli_opts=

branch=${B:-.}

# Deliberately left unquoted at the call site so "-s" and the serial become
# two separate adb arguments.
adbserial=${S:+"-s $S"}

model=${M:-"Llama-3.2-3B-Instruct-Q4_0.gguf"}

device=${D:-"HTP0"}

verbose=${V:+"GGML_HEXAGON_VERBOSE=$V"}

experimental=${E:+"GGML_HEXAGON_EXPERIMENTAL=$E"}

sched=
if [ -n "$SCHED" ]; then
    sched="GGML_SCHED_DEBUG=2"
    cli_opts="$cli_opts -v"
fi

profile=${PROF:+"GGML_HEXAGON_PROFILE=$PROF GGML_HEXAGON_OPSYNC=1"}

opmask=${OPMASK:+"GGML_HEXAGON_OPMASK=$OPMASK"}

nhvx=${NHVX:+"GGML_HEXAGON_NHVX=$NHVX"}

ndev=${NDEV:+"GGML_HEXAGON_NDEV=$NDEV"}

# The command string below is parsed a second time by the shell on the
# device, so the caller's arguments are quoted here, before tracing starts.
user_args=$(quote_args "$@")

set -x

# shellcheck disable=SC2086 # $adbserial must split into "-s" and the serial
adb $adbserial shell " \
  cd $basedir; ulimit -c unlimited; \
  LD_LIBRARY_PATH=$basedir/$branch/lib \
  ADSP_LIBRARY_PATH=$basedir/$branch/lib \
  $verbose $experimental $sched $opmask $profile $nhvx $ndev \
  ./$branch/bin/llama-cli --no-mmap -m $basedir/../gguf/$model \
  -t 4 --ctx-size 8192 --batch-size 128 -ctk q8_0 -ctv q8_0 -fa on \
  -ngl 99 --device $device $cli_opts $user_args \
"