1
0

comp.sh 502 B

12345678
  #!/bin/bash
  # comp.sh - run the converted GGUF model and the original model on the same
  # prompt, then run the tensor comparison script. The combined stdout/stderr
  # of each step is captured in a log file under data/.
  #
  # All paths are relative, so run this from the directory in which they
  # resolve (NOTE(review): presumably the llama.cpp checkout root - confirm).

  # Stop at the first failing step so the comparison never runs against stale
  # or partial output left behind by an earlier step.
  set -euo pipefail

  readonly MODEL_DIR="reference/qwen3_ntl"
  readonly PROMPT="Once upon a time"
  readonly NUM_TOKENS=30
  readonly OUT_DIR="data"

  #######################################
  # Announce a step, run its command with stdout and stderr redirected to a
  # log file, and abort the script if the command fails.
  # Arguments: $1 - progress message printed to stdout
  #            $2 - log file receiving the command's stdout and stderr
  #            $3... - command and its arguments
  # Outputs:   progress message on stdout; failure notice on stderr
  # Returns:   0 on success; exits the script with the command's status
  #            otherwise
  #######################################
  run_step() {
    local message=$1 log_file=$2
    shift 2
    local status=0
    echo "$message"
    # Capture the status explicitly so we can point at the log before exiting.
    "$@" &> "$log_file" || status=$?
    if (( status != 0 )); then
      printf 'Step failed with exit status %d; see %s\n' \
        "$status" "$log_file" >&2
      exit "$status"
    fi
  }

  # The log redirections fail if the output directory is missing.
  mkdir -p -- "$OUT_DIR"

  run_step "Running converted model." "${OUT_DIR}/tinylong-30-tok.txt" \
    llama-cli -no-cnv -m "${MODEL_DIR}/qwen3_ntl.gguf" -p "$PROMPT" \
    -n "$NUM_TOKENS" --temp 0

  run_step "Running original model." "${OUT_DIR}/tinylong-30-tok-org.txt" \
    python examples/model-conversion/scripts/causal/run-org-model-multi-token.py \
    --model-path "$MODEL_DIR" --num-tokens "$NUM_TOKENS" --prompt "$PROMPT"

  # NOTE(review): the meaning of the positional arguments "30 16" is defined by
  # compare_tensors.py, which is not visible here; the first presumably matches
  # the token count - confirm before changing NUM_TOKENS.
  run_step "Running tensor comparison." "${OUT_DIR}/tinylong-30-compare.txt" \
    python reference/compare_tensors.py 30 16

  echo "Done."