#!/bin/sh
#
# run-cli.sh - run llama-completion on an Android device through adb.
#
# Usage: [VAR=value ...] ./run-cli.sh [extra llama-completion arguments]
#
# Optional environment variables (each one is ignored when unset or empty):
#   B       subdirectory of $basedir that holds bin/ and lib/ (default: .)
#   S       adb device serial; passed to adb as "-s $S"
#   M       model file name, looked up in $basedir/../gguf
#           (default: Llama-3.2-3B-Instruct-Q4_0.gguf)
#   D       value passed to --device (default: HTP0)
#   V       sets GGML_HEXAGON_VERBOSE=$V for the remote command
#   E       sets GGML_HEXAGON_EXPERIMENTAL=$E for the remote command
#   SCHED   when non-empty, sets GGML_SCHED_DEBUG=2 and appends -v
#   PROF    sets GGML_HEXAGON_PROFILE=$PROF and GGML_HEXAGON_OPSYNC=1
#   OPMASK  sets GGML_HEXAGON_OPMASK=$OPMASK for the remote command
#   NHVX    sets GGML_HEXAGON_NHVX=$NHVX for the remote command
#   NDEV    sets GGML_HEXAGON_NDEV=$NDEV for the remote command
#
# Extra arguments are appended verbatim to the remote command line, so they
# are parsed a second time by the shell on the device. An argument that
# contains spaces or shell metacharacters needs its own layer of quoting,
# e.g.  ./run-cli.sh -p "'hello world'"

# Basedir on device
basedir=/data/local/tmp/llama.cpp

# Extra llama-completion options accumulated by the switches below.
cli_opts=

# Settings with a built-in default.
branch=${B:-.}
model=${M:-Llama-3.2-3B-Instruct-Q4_0.gguf}
device=${D:-HTP0}

# Kept as one string; it is expanded unquoted below so that it splits into
# the two words "-s" and the serial number.
adbserial=${S:+"-s $S"}

# Each of these is either empty or a NAME=value prefix for the remote command.
verbose=${V:+"GGML_HEXAGON_VERBOSE=$V"}
experimental=${E:+"GGML_HEXAGON_EXPERIMENTAL=$E"}
profile=${PROF:+"GGML_HEXAGON_PROFILE=$PROF GGML_HEXAGON_OPSYNC=1"}
opmask=${OPMASK:+"GGML_HEXAGON_OPMASK=$OPMASK"}
nhvx=${NHVX:+"GGML_HEXAGON_NHVX=$NHVX"}
ndev=${NDEV:+"GGML_HEXAGON_NDEV=$NDEV"}

# SCHED sets the scheduler debug variable and also passes -v to the binary.
sched=
if [ -n "$SCHED" ]; then
  sched="GGML_SCHED_DEBUG=2"
  cli_opts="$cli_opts -v"
fi

# Trace the final adb invocation so the exact remote command is visible.
set -x

# The whole remote command is a single string: every variable is expanded
# locally, and the backslash-newline pairs are removed inside the double
# quotes, so the device shell receives one line. "$*" (not "$@") is used on
# purpose: the extra arguments are joined with spaces into that same string.
# shellcheck disable=SC2086 # $adbserial must word-split into "-s" "<serial>"
adb $adbserial shell " \
cd $basedir; ulimit -c unlimited; \
LD_LIBRARY_PATH=$basedir/$branch/lib \
ADSP_LIBRARY_PATH=$basedir/$branch/lib \
$verbose $experimental $sched $opmask $profile $nhvx $ndev \
./$branch/bin/llama-completion --no-mmap -m $basedir/../gguf/$model \
--poll 1000 -t 6 --cpu-mask 0xfc --cpu-strict 1 \
--ctx-size 8192 --batch-size 128 -ctk q8_0 -ctv q8_0 -fa on \
-ngl 99 --device $device $cli_opts $* \
"