|
|
@@ -324,7 +324,7 @@ int main(int argc, char ** argv) {
|
|
|
log_tostr(embd_inp.empty()), n_matching_session_tokens, embd_inp.size(), session_tokens.size(), embd_inp.size());
|
|
|
|
|
|
// if we will use the cache for the full prompt without reaching the end of the cache, force
|
|
|
- // reevaluation of the last token token to recalculate the cached logits
|
|
|
+ // reevaluation of the last token to recalculate the cached logits
|
|
|
if (!embd_inp.empty() && n_matching_session_tokens == embd_inp.size() && session_tokens.size() > embd_inp.size()) {
|
|
|
LOGLN("recalculate the cached logits (do): session_tokens.resize( %zu )", embd_inp.size() - 1);
|
|
|
|