llama.cpp/quantize.sh at c494ed5b94b429d3d73721235e78c9f5fa6e5652 - llama.cpp - Gitea: Git with a cup of tea

root/llama.cpp

mirror of https://github.com/ggerganov/llama.cpp.git synced 2024-12-26 11:24:35 +00:00

Pavol Rusnak d1f224712d

Add quantize script for batch quantization (#92)

* Add quantize script for batch quantization

* Indentation

* README for new quantize.sh

* Fix script name

* Fix file list on Mac OS

---------

Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>

2023-03-13 18:15:20 +02:00

16 lines

309 B

Bash

Executable File

Raw Blame History

 #!/usr/bin/env bash
 #
 # Batch-quantize the f16 ggml model file(s) of one model size.
 #
 # Usage: quantize.sh 7B|13B|30B|65B [--remove-f16]
 #
 #   $1  model size; must match ^[0-9]{1,2}B$ and names the directory
 #       models/<size>/ that is scanned.
 #   $2  optional; when it is exactly --remove-f16, each f16 input file is
 #       deleted after it has been quantized successfully.
 #
 # Every file matching models/<size>/ggml-model-f16.bin* is handed to
 # ./quantize together with an output path in which the first "f16" is
 # replaced by "q4_0". All paths are relative, so run this from the
 # directory that contains both ./quantize and models/.
 #
 # Exit status: 0 when every matching file was quantized; 1 on a usage
 # error, when no input file is found, or when ./quantize fails.

 if ! [[ "$1" =~ ^[0-9]{1,2}B$ ]]; then
     # Usage is shown on an error path, so it belongs on stderr.
     {
         echo
         echo "Usage: quantize.sh 7B|13B|30B|65B [--remove-f16]"
         echo
     } >&2
     exit 1
 fi

 # Let the shell expand the pattern instead of parsing `ls` output: the
 # result is not word-split and behaves the same on every platform.
 found=0
 for i in "models/$1/ggml-model-f16.bin"*; do
     # Without nullglob an unmatched pattern is left as the literal string;
     # skip it rather than passing a non-existent path to ./quantize.
     [[ -e "$i" ]] || continue
     found=1

     # The trailing 2 is passed through unchanged; presumably it selects the
     # q4_0 format in ./quantize -- TODO confirm against that tool's usage.
     if ! ./quantize "$i" "${i/f16/q4_0}" 2; then
         # Stop here so a failed run can never be followed by deleting the
         # f16 source, which may be the only remaining copy of the model.
         echo "quantize.sh: failed to quantize $i" >&2
         exit 1
     fi

     if [[ "$2" == "--remove-f16" ]]; then
         rm -- "$i"
     fi
 done

 if [[ "$found" -eq 0 ]]; then
     echo "quantize.sh: no files match models/$1/ggml-model-f16.bin*" >&2
     exit 1
 fi