Explorar o código

llama : remember and restore kv cache data pointers (#1104)

because their value is stored in buf and overwritten by memcpy
xaedes hai 2 anos
pai
achega
8687c1f258
Modificouse 1 ficheiro con 4 adicións e 0 borrados
  1. 4 0
      llama.cpp

+ 4 - 0
llama.cpp

@@ -2092,7 +2092,11 @@ void llama_set_kv_cache(
                          int   n_token_count) {
     // Make sure we have the same kv cache setup
     LLAMA_ASSERT(ctx->model.kv_self.buf.size == n_size);
+    void * k_data = ctx->model.kv_self.k->data; // remember data pointers
+    void * v_data = ctx->model.kv_self.v->data; // because their value is stored in buf and overwritten by memcpy
     memcpy(ctx->model.kv_self.buf.addr, kv_cache, n_size);
+    ctx->model.kv_self.k->data = k_data; // restore correct data pointers
+    ctx->model.kv_self.v->data = v_data;
     ctx->model.kv_self.n = n_token_count;
 }