common : llama_byte_to_token: allow falling back to finding just the token byte in SPM vocabs

akx · akx · commit dce9bc97b94c · 2024-02-13T13:05:51.000+02:00
diff --git a/llama.cpp b/llama.cpp
@@ -7716,7 +7716,12 @@ static llama_token llama_byte_to_token(const llama_vocab & vocab, uint8_t ch) {
     switch (llama_vocab_get_type(vocab)) {
         case LLAMA_VOCAB_TYPE_SPM: {
             const char buf[7] = { '<', '0', 'x', hex[ch >> 4], hex[ch & 15], '>', 0 };
-            return vocab.token_to_id.at(buf);
+            if (vocab.token_to_id.find(buf) != vocab.token_to_id.end()) {
+                return vocab.token_to_id.at(buf);
+            }
+            // No <0xXX> token in this vocab: fall back to the byte itself as a one-character string
+            const char buf2[2] = { (char)ch, 0 };
+            return vocab.token_to_id.at(buf2);
         }
         case LLAMA_VOCAB_TYPE_WPM:
         case LLAMA_VOCAB_TYPE_BPE: {