Browse Source

kv-cache : fix k-shift for multiple streams (#14742)

ggml-ci
Georgi Gerganov 6 months ago
parent
commit
d6fb3f6b49
1 changed file with 1 addition and 1 deletion
  1. 1 1
      src/llama-kv-cache-unified.cpp

+ 1 - 1
src/llama-kv-cache-unified.cpp

@@ -1261,7 +1261,7 @@ void llama_kv_cache_unified::set_input_k_shift(ggml_tensor * dst) const {
         const auto & cells = v_cells[s];
         const auto & cells = v_cells[s];
 
 
         for (uint32_t i = 0; i < cells.size(); ++i) {
         for (uint32_t i = 0; i < cells.size(); ++i) {
-            data[i] = cells.is_empty(i) ? 0 : cells.get_shift(i);
+            data[s*cells.size() + i] = cells.is_empty(i) ? 0 : cells.get_shift(i);
         }
         }
     }
     }
 }
 }