top-p: correct gt to gte

2023-06-20 20:48:09 -04:00 · 2023-06-20 20:48:09 -04:00 · 407b77cdb3
commit 407b77cdb3
parent 1e7755cfcb
1 changed files with 3 additions and 2 deletions
--- a/llama.cpp
+++ b/llama.cpp
@@ -2005,8 +2005,9 @@ void llama_sample_top_p(struct llama_context * ctx, llama_token_data_array * can
    for (size_t i = 0; i < candidates->size; ++i) {
        cum_sum += candidates->data[i].p;

-        // Check if the running sum is greater than p or if we have kept at least min_keep tokens
-        if (cum_sum > p && i + 1 >= min_keep) {
+        // Check if the running sum is at least p and we have kept at least min_keep tokens
+        // we set last_idx to i + 1 so that the current element (index i) is included in the set
+        if (cum_sum >= p && i + 1 >= min_keep) {
            last_idx = i + 1;
            break;
        }