Skip to content

Commit 1387ea2

Browse files
authored
llama : pre-allocate input tensors in a separate buffer (#5100)
1 parent 26d6076 commit 1387ea2

File tree

2 files changed

+146
-161
lines changed

2 files changed

+146
-161
lines changed

ggml-alloc.c

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -109,8 +109,8 @@ void ggml_tallocr_alloc(ggml_tallocr_t alloc, struct ggml_tensor * tensor) {
109 109           if (block->size >= size) {
110 110               best_fit_block = alloc->n_free_blocks - 1;
111 111           } else {
112     -             fprintf(stderr, "%s: not enough space in the buffer (needed %zu, largest block available %zu)\n",
113     -                     __func__, size, max_avail);
    112 +             fprintf(stderr, "%s: not enough space in the buffer to allocate %s (needed %zu, largest block available %zu)\n",
    113 +                     __func__, tensor->name, size, max_avail);
114 114               GGML_ASSERT(!"not enough space in the buffer");
115 115               return;
116 116           }

0 commit comments

Comments
 (0)