Skip to content

Commit fa384cb

Browse files
metascroy authored and malfet committed
switch to smaller model to speed up CI test (#210)
1 parent eeffb0a commit fa384cb

File tree

1 file changed

+5
-4
lines changed

1 file changed

+5
-4
lines changed

.github/workflows/compile-gguf.yml

Lines changed: 5 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -35,15 +35,16 @@ jobs:
       - name: Download GGUF
         run: |
           mkdir gguf_files
-          export GGUF_PATH=gguf_files/llama-2-7b.Q4_0.gguf
+          export GGUF_PATH=gguf_files/TinyLlama-1.1B-openorca.Q4_0.gguf
           export TOKENIZER_PATH=gguf_files/tokenizer.model
-          wget -O ${GGUF_PATH} "https://huggingface.co/TheBloke/Llama-2-7B-GGUF/resolve/main/llama-2-7b.Q4_0.gguf?download=true"
+
+          wget -O ${GGUF_PATH} "https://huggingface.co/TheBloke/TinyLlama-1.1B-1T-OpenOrca-GGUF/resolve/main/tinyllama-1.1b-1t-openorca.Q4_0.gguf?download=true"
           wget -O ${TOKENIZER_PATH} https://github.com/karpathy/llama2.c/raw/master/tokenizer.model
       - name: Run inference
         run: |
-          export GGUF_PATH=gguf_files/llama-2-7b.Q4_0.gguf
+          export GGUF_PATH=gguf_files/TinyLlama-1.1B-openorca.Q4_0.gguf
           export TOKENIZER_PATH=gguf_files/tokenizer.model
-          export MODEL_NAME=llama-2-7b.Q4_0.gguf
+          export MODEL_NAME=TinyLlama-1.1B-openorca.Q4_0.gguf
           export MODEL_DIR=/tmp
 
           echo "******************************************"

0 commit comments

Comments
 (0)