@@ -270,19 +270,17 @@ int main(int argc, char ** argv) {
270
270
}
271
271
}
272
272
273
+ LOGLN (
274
+ " recalculate the cached logits (check): embd_inp.empty() %s, n_matching_session_tokens %zu, embd_inp.size() %zu, session_tokens.size() %zu, embd_inp.size() %zu" ,
275
+ LOG_TOSTR (embd_inp.empty ()), n_matching_session_tokens, embd_inp.size (), session_tokens.size (), embd_inp.size ())
276
+
273
277
// if we will use the cache for the full prompt without reaching the end of the cache, force
274
278
// reevaluation of the last token to recalculate the cached logits
275
279
if (!embd_inp.empty () && n_matching_session_tokens == embd_inp.size () &&
276
280
session_tokens.size () > embd_inp.size ()) {
277
- #ifndef _WIN32
278
- LOG (
279
- " recalculate the cached logits: embd_inp.empty() %s, n_matching_session_tokens %lu, embd_inp.size() %lu, session_tokens.size() %lu, embd_inp.size() %lu, session_tokens.resize( %lu )" ,
280
- LOG_TOSTR (embd_inp.empty ()), n_matching_session_tokens, embd_inp.size (), session_tokens.size (), embd_inp.size (), embd_inp.size () - 1 )
281
- #else
282
- LOG (
283
- " recalculate the cached logits: embd_inp.empty() %s, n_matching_session_tokens %llu, embd_inp.size() %llu, session_tokens.size() %llu, embd_inp.size() %llu, session_tokens.resize( %llu )" ,
284
- LOG_TOSTR (embd_inp.empty ()), n_matching_session_tokens, embd_inp.size (), session_tokens.size (), embd_inp.size (), embd_inp.size () - 1 )
285
- #endif
281
+
282
+ LOGLN (" recalculate the cached logits (do): session_tokens.resize( %zu )" , embd_inp.size () - 1 )
283
+
286
284
session_tokens.resize (embd_inp.size () - 1 );
287
285
}
288
286
0 commit comments