|
|
@@ -183,7 +183,7 @@ llama_kv_cache_unified::llama_kv_cache_unified(
|
|
|
const size_t memory_size_k = size_k_bytes();
|
|
|
const size_t memory_size_v = size_v_bytes();
|
|
|
|
|
|
- LLAMA_LOG_INFO("%s: size = %7.2f MiB (%6u cells, %3d layers, %2u/%2u seqs), K (%s): %7.2f MiB, V (%s): %7.2f MiB\n", __func__,
|
|
|
+ LLAMA_LOG_INFO("%s: size = %7.2f MiB (%6u cells, %3d layers, %2u/%u seqs), K (%s): %7.2f MiB, V (%s): %7.2f MiB\n", __func__,
|
|
|
(float)(memory_size_k + memory_size_v) / (1024.0f * 1024.0f), kv_size, (int) layers.size(), n_seq_max, n_stream,
|
|
|
ggml_type_name(type_k), (float)memory_size_k / (1024.0f * 1024.0f),
|
|
|
ggml_type_name(type_v), (float)memory_size_v / (1024.0f * 1024.0f));
|