fixes based on review (@JohannesGaessler)

2024-02-29 00:41:31 +09:00 · 2024-02-29 00:41:31 +09:00 · e4896e71b5
commit e4896e71b5
parent 94f6256fd0
1 changed files with 4 additions and 4 deletions
--- a/examples/speculative/speculative.cpp
+++ b/examples/speculative/speculative.cpp
@@ -218,7 +218,7 @@ int main(int argc, char ** argv) {
                    // stochastic verification

                    llama_token_data_array dist_tgt = llama_sampling_probability_distribution(ctx_sampling, ctx_tgt, NULL, drafts[s_keep].i_batch_tgt[i_dft]);
-                    float p_tgt, p_dft;
+                    float p_tgt = 0, p_dft = 0;

                    // GGML_ASSERT(dist_tgt.size() == dist_dft.size());
                    for (int s = 0; s < n_seq_dft; ++s) {
@@ -239,7 +239,7 @@ int main(int argc, char ** argv) {

                        float r = u_dist(r_gen) / (float) RAND_MAX;
                        llama_token_data_array dist_dft = drafts[s].dist[i_dft];
-                        // acquire the probability of the token from the draft model
+                        // acquire the token probabilities assigned by the draft and target models
                        for (int i = 0; i < dist_tgt.size; i++) {
                            if (dist_tgt.data[i].id == drafts[s].tokens[i_dft]) {
                                p_tgt = dist_tgt.data[i].p;
@@ -295,7 +295,7 @@ int main(int argc, char ** argv) {
                        for(int i = s; i < n_seq_dft; i++) {
                            if (drafts[i].tokens[i_dft] == drafts[s].tokens[i_dft]) {
                                // synchronize active status for sequences with the same drafted token
-                                drafts[i].active = drafts[i].active & accept;
+                                drafts[i].active = drafts[i].active && accept;
                            }
                        }