#!/usr/bin/env bash
#
# quantize.sh - quantize every f16 model part of one model size.
#
# Usage: quantize.sh 7B|13B|30B|65B [--remove-f16]
#
# Arguments:
#   $1  model size directory under models/: one or two digits followed by
#       "B" (e.g. 7B, 13B).
#   $2  optional; when exactly "--remove-f16", each f16 input file is deleted
#       after it has been quantized successfully.
#
# For every file matching models/<size>/ggml-model-f16.bin* this runs
#   ./quantize <input> <output> 2
# where <output> is the input path with the first "f16" replaced by "q4_0".
#
# Paths are relative: run this from the directory that contains both the
# ./quantize executable and the models/ directory.
#
# Exit status: 0 on success; 1 on bad usage, when no input files are found,
# or when ./quantize fails for a file.

# Print the usage text to stderr and exit with status 1.
usage() {
  {
    echo
    echo "Usage: quantize.sh 7B|13B|30B|65B [--remove-f16]"
    echo
  } >&2
  exit 1
}

# Reject a missing or malformed size before touching the filesystem.
[[ "${1:-}" =~ ^[0-9]{1,2}B$ ]] || usage

# Let the shell expand the glob instead of parsing `ls` output, so paths are
# never word-split. nullglob makes an unmatched pattern expand to nothing
# rather than to the literal pattern text.
shopt -s nullglob
inputs=(models/"$1"/ggml-model-f16.bin*)
shopt -u nullglob

if (( ${#inputs[@]} == 0 )); then
  echo "quantize.sh: no files match models/$1/ggml-model-f16.bin*" >&2
  exit 1
fi

for input in "${inputs[@]}"; do
  # The trailing 2 is handed to ./quantize as its third argument; presumably
  # it selects the q4_0 format that the output name advertises (confirm
  # against ./quantize's own usage text).
  if ! ./quantize "$input" "${input/f16/q4_0}" 2; then
    # Stop here and keep the f16 file: deleting it after a failed run would
    # lose the only good copy of this model part.
    echo "quantize.sh: ./quantize failed for $input" >&2
    exit 1
  fi

  if [[ "${2:-}" == "--remove-f16" ]]; then
    rm -- "$input"
  fi
done