We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 8b35acd · commit 98595e2 · Copy full SHA for 98595e2
.github/workflows/et-gguf.yml
@@ -86,6 +86,10 @@ jobs:
86
- name: Run inference
87
run: |
88
export MODEL_DIR=/tmp
89
+ export GGUF_PATH=${PWD}/gguf_files/llama-2-7b.Q4_0.gguf
90
+ export TOKENIZER_PATH=${PWD}/gguf_files/tokenizer.model
91
+ export MODEL_NAME=llama-2-7b_Q4_0_gguf
92
+
93
python export.py --tokenizer-path ${TOKENIZER_PATH} --gguf-path ${GGUF_PATH} --output-pte-path ${MODEL_DIR}/${MODEL_NAME}.pte
94
python generate.py --tokenizer-path ${TOKENIZER_PATH} --gguf-path ${GGUF_PATH} --temperature 0 --pte-path ${MODEL_DIR}/${MODEL_NAME}.pte > ./output_et
95
cat ./output_et
0 commit comments