File tree Expand file tree Collapse file tree 4 files changed +4
-4
lines changed Expand file tree Collapse file tree 4 files changed +4
-4
lines changed Original file line number Diff line number Diff line change @@ -23,7 +23,7 @@ ENV CUDA_DOCKER_ARCH=${CUDA_DOCKER_ARCH}
23
23
# Enable CUDA
24
24
ENV LLAMA_CUDA=1
25
25
26
- RUN make -j$(nproc) llama
26
+ RUN make -j$(nproc) llama-cli
27
27
28
28
FROM ${BASE_CUDA_RUN_CONTAINER} as runtime
29
29
Original file line number Diff line number Diff line change @@ -40,6 +40,6 @@ ENV LLAMA_HIPBLAS=1
40
40
ENV CC=/opt/rocm/llvm/bin/clang
41
41
ENV CXX=/opt/rocm/llvm/bin/clang++
42
42
43
- RUN make -j$(nproc) llama
43
+ RUN make -j$(nproc) llama-cli
44
44
45
45
ENTRYPOINT [ "/app/llama-cli" ]
Original file line number Diff line number Diff line change @@ -9,7 +9,7 @@ WORKDIR /app
9
9
10
10
COPY . .
11
11
12
- RUN make -j$(nproc) llama
12
+ RUN make -j$(nproc) llama-cli
13
13
14
14
FROM ubuntu:$UBUNTU_VERSION as runtime
15
15
Original file line number Diff line number Diff line change @@ -240,7 +240,7 @@ jobs:
240
240
echo "Fetch llama2c model"
241
241
wget https://huggingface.co/karpathy/tinyllamas/resolve/main/stories260K/stories260K.bin
242
242
./bin/convert-llama2c-to-ggml --copy-vocab-from-model ./tok512.bin --llama2c-model stories260K.bin --llama2c-output-model stories260K.gguf
243
- ./bin/llama -m stories260K.gguf -p "One day, Lily met a Shoggoth" -n 500 -c 256
243
+ ./bin/llama-cli -m stories260K.gguf -p "One day, Lily met a Shoggoth" -n 500 -c 256
244
244
245
245
- name : Determine tag name
246
246
id : tag
You can’t perform that action at this time.
0 commit comments