diff --git a/llama.cpp b/llama.cpp
index 854bb8993..e4517959a 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -1229,7 +1229,9 @@ static llama_vocab::id llama_sample_top_p_top_k(
         }
     }
 
-    sample_top_k(logits_id, top_k);
+    if (top_k > 0 && top_k < n_logits) {
+        sample_top_k(logits_id, top_k);
+    }
 
     float maxl = -std::numeric_limits<float>::infinity();
     for (const auto & kv : logits_id) {