Spaces:

ggml-org
/

gguf-my-repo

Running on A10G

File size: 310 Bytes

3eaaf3a
 
 
 
 
 
 
 
 
 
 
 
e510c4e
3eaaf3a
e88cde7
e510c4e
3eaaf3a

#!/bin/bash
#
# Build the llama.cpp tools used by the app, then launch the app.
#
# Environment:
#   RUN_LOCALLY  When set to a non-empty value the build runs without
#                LLAMA_CUDA; otherwise LLAMA_CUDA=1 is exported.

# Stop at the first failing step so app.py is never started after a failed
# clone or build, and never from the wrong working directory.
set -euo pipefail

if [[ ! -d "llama.cpp" ]]; then
  # only run in dev env
  git clone https://github.com/ggerganov/llama.cpp
fi

# ":-" keeps the unset case working under `set -u`.
if [[ -z "${RUN_LOCALLY:-}" ]]; then
  # enable CUDA if NOT running locally
  export LLAMA_CUDA=1
fi

# Build inside a subshell: the caller's working directory is left untouched,
# so no `cd ..` is needed and a failed `cd` cannot misplace later commands.
(
  cd llama.cpp
  make -j llama-quantize llama-gguf-split llama-imatrix
)

python app.py