llama : sanitize tokens in the upper bound (ggml-org#9359)

slaren · arthw · commit 5f10d4557d17 · 2024-11-15T12:34:21.000+08:00
diff --git a/src/llama.cpp b/src/llama.cpp
@@ -16081,7 +16081,7 @@ static int llama_decode_internal(
     }
 
     for (uint32_t i = 0; i < n_tokens_all; ++i) {
-        if (batch_all.token[i] < 0) {
+        if (batch_all.token[i] < 0 || (uint32_t)batch_all.token[i] >= lctx.model.vocab.n_vocab) {
             LLAMA_LOG_ERROR("%s: invalid token[%d] = %d", __func__, i, batch_all.token[i]);
             return -1;
         }
@@ -16380,7 +16380,7 @@ static int llama_encode_internal(
     }
 
     for (uint32_t i = 0; i < n_tokens; ++i) {
-        if (batch.token[i] < 0) {
+        if (batch.token[i] < 0 || (uint32_t)batch.token[i] >= lctx.model.vocab.n_vocab) {
             LLAMA_LOG_ERROR("%s: invalid token[%d] = %d", __func__, i, batch.token[i]);
             return -1;
         }

Original file line number	Diff line number	Diff line change
`@@ -16081,7 +16081,7 @@ static int llama_decode_internal(`
`16081`	`16081`	`}`
`16082`	`16082`
`16083`	`16083`	`for (uint32_t i = 0; i < n_tokens_all; ++i) {`
`16084`		`- if (batch_all.token[i] < 0) {`
	`16084`	`+ if (batch_all.token[i] < 0 || (uint32_t)batch_all.token[i] >= lctx.model.vocab.n_vocab) {`
`16085`	`16085`	`LLAMA_LOG_ERROR("%s: invalid token[%d] = %d", __func__, i, batch_all.token[i]);`
`16086`	`16086`	`return -1;`
`16087`	`16087`	`}`
`@@ -16380,7 +16380,7 @@ static int llama_encode_internal(`
`16380`	`16380`	`}`
`16381`	`16381`
`16382`	`16382`	`for (uint32_t i = 0; i < n_tokens; ++i) {`
`16383`		`- if (batch.token[i] < 0) {`
	`16383`	`+ if (batch.token[i] < 0 || (uint32_t)batch.token[i] >= lctx.model.vocab.n_vocab) {`
`16384`	`16384`	`LLAMA_LOG_ERROR("%s: invalid token[%d] = %d", __func__, i, batch.token[i]);`
`16385`	`16385`	`return -1;`
`16386`	`16386`	`}`