top-p: correct gt to gte
This commit is contained in:
parent
1e7755cfcb
commit
407b77cdb3
1 changed file with 3 additions and 2 deletions
|
@ -2005,8 +2005,9 @@ void llama_sample_top_p(struct llama_context * ctx, llama_token_data_array * can
|
||||||
for (size_t i = 0; i < candidates->size; ++i) {
|
for (size_t i = 0; i < candidates->size; ++i) {
|
||||||
cum_sum += candidates->data[i].p;
|
cum_sum += candidates->data[i].p;
|
||||||
|
|
||||||
// Check if the running sum is greater than p or if we have kept at least min_keep tokens
|
// Check if the running sum is at least p and we have kept at least min_keep tokens
|
||||||
if (cum_sum > p && i + 1 >= min_keep) {
|
// we set the last index to i+1 to indicate that the current iterate should be included in the set
|
||||||
|
if (cum_sum >= p && i + 1 >= min_keep) {
|
||||||
last_idx = i + 1;
|
last_idx = i + 1;
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue