File tree Expand file tree Collapse file tree 1 file changed +9
-19
lines changed Expand file tree Collapse file tree 1 file changed +9
-19
lines changed Original file line number Diff line number Diff line change 4
4
# Copyright (C) 2024 Intel Corporation
5
5
# SPDX-License-Identifier: MIT
6
6
7
- INPUT2=" Building a website can be done in 10 simple steps:\nStep 1:"
8
7
source /opt/intel/oneapi/setvars.sh
9
8
10
- if [ $# -gt 0 ]; then
11
- GGML_SYCL_DEVICE=$1
12
- GGML_SYCL_SINGLE_GPU=1
13
- else
14
- GGML_SYCL_DEVICE=0
15
- GGML_SYCL_SINGLE_GPU=0
16
- fi
17
-
18
9
# export GGML_SYCL_DEBUG=1
19
10
20
-
21
11
# ZES_ENABLE_SYSMAN=1 enables querying the GPU's free memory via sycl::aspect::ext_intel_free_memory. Recommended when using --split-mode=layer.
22
12
23
- if [ $GGML_SYCL_SINGLE_GPU -eq 1 ]; then
13
+ INPUT_PROMPT=" Building a website can be done in 10 simple steps:\nStep 1:"
14
+ MODEL_FILE=llama-2-7b.Q4_0.gguf
15
+ NGL=33
16
+
17
+ if [ $# -gt 0 ]; then
18
+ GGML_SYCL_DEVICE=$1
24
19
echo " use $GGML_SYCL_DEVICE as main GPU"
25
20
# use single GPU only
26
- ZES_ENABLE_SYSMAN=1 ./build/bin/llama-cli -m models/llama-2-7b.Q4_0.gguf -p " ${INPUT2} " -n 400 -e -ngl 33 -s 0 -mg $GGML_SYCL_DEVICE -sm none
21
+ ZES_ENABLE_SYSMAN=1 ./build/bin/llama-cli -m models/${MODEL_FILE} -p " ${INPUT_PROMPT} " -n 400 -e -ngl ${NGL} -s 0 -mg $GGML_SYCL_DEVICE -sm none
22
+
27
23
else
28
24
# use multiple GPUs with same max compute units
29
- ZES_ENABLE_SYSMAN=1 ./build/bin/llama-cli -m models/llama-2-7b.Q4_0.gguf -p " ${INPUT2} " -n 400 -e -ngl 33 -s 0
25
+ ZES_ENABLE_SYSMAN=1 ./build/bin/llama-cli -m models/${MODEL_FILE} -p " ${INPUT_PROMPT} " -n 400 -e -ngl ${NGL} -s 0
30
26
fi
31
-
32
- # use main GPU only
33
- # ZES_ENABLE_SYSMAN=1 ./build/bin/llama-cli -m models/llama-2-7b.Q4_0.gguf -p "${INPUT2}" -n 400 -e -ngl 33 -s 0 -mg $GGML_SYCL_DEVICE -sm none
34
-
35
- # use multiple GPUs with same max compute units
36
- # ZES_ENABLE_SYSMAN=1 ./build/bin/llama-cli -m models/llama-2-7b.Q4_0.gguf -p "${INPUT2}" -n 400 -e -ngl 33 -s 0
You can’t perform that action at this time.
0 commit comments