1 file changed: +2 -2 lines changed
Original file line number | Diff line number | Diff line change
@@ -594,7 +594,7 @@ int32_t llama_kv_cache_unified::find_slot(const llama_ubatch & ubatch) const {
594
594
595
595
// can we use this cell? either:
596
596
// - the cell is empty
597
- // - the cell is occupied only by the same sequence, and the sequence is not masked
597
+ // - the cell is occupied only by the same sequence, and the pos is masked
598
598
const bool can_use =
599
599
cells.is_empty (head_cur + i) ||
600
600
(
@@ -2307,7 +2307,7 @@ llama_memory_decode_state_ptr llama_kv_cache_recurrent::init(const llama_batch &
2307
2307
}
2308
2308
2309
2309
bool llama_kv_cache_recurrent::prepare (const std::vector<llama_ubatch> & ubatches) {
2310
- // simply remember the full state
2310
+ // simply remember the full state because it is very small for this type of cache
2311
2311
// TODO: optimize
2312
2312
auto org_cells = cells;
2313
2313
auto org_used = used;
You can’t perform that action at this time.
0 commit comments