1 file changed: +2 -2 lines changed
Original file line number | Diff line number | Diff line change
@@ -574,7 +574,7 @@ int32_t llama_kv_cache_unified::find_slot(const llama_ubatch & ubatch) const {
574
574
575
575
// can we use this cell? either:
576
576
// - the cell is empty
577
- // - the cell is occupied only by the same sequence, and the sequence is not masked
577
+ // - the cell is occupied only by the same sequence, and the pos is masked
578
578
const bool can_use =
579
579
cells.is_empty (head_cur + i) ||
580
580
(
@@ -2277,7 +2277,7 @@ llama_memory_decode_state_ptr llama_kv_cache_recurrent::init(const llama_batch &
2277
2277
}
2278
2278
2279
2279
bool llama_kv_cache_recurrent::prepare (const std::vector<llama_ubatch> & ubatches) {
2280
- // simply remember the full state
2280
+ // simply remember the full state because it is very small for this type of cache
2281
2281
// TODO: optimize
2282
2282
auto org_cells = cells;
2283
2283
auto org_used = used;
You can’t perform that action at this time.
0 commit comments