@@ -74,8 +74,6 @@ int main(int argc, char ** argv) {
 auto next_token = llama_sampler_sample (smpl, ctx, -1 );
 auto next_token_str = llama_token_to_piece (ctx, next_token);
 
-llama_sampler_accept (smpl, next_token);
-
 printf (" %s" , next_token_str.c_str ());
 result0 += next_token_str;
 
@@ -132,8 +130,6 @@ int main(int argc, char ** argv) {
 auto next_token = llama_sampler_sample (smpl2, ctx2, -1 );
 auto next_token_str = llama_token_to_piece (ctx2, next_token);
 
-llama_sampler_accept (smpl2, next_token);
-
 printf (" %s" , next_token_str.c_str ());
 result1 += next_token_str;
 
@@ -222,8 +218,6 @@ int main(int argc, char ** argv) {
 auto next_token = llama_sampler_sample (smpl3, ctx3, -1 );
 auto next_token_str = llama_token_to_piece (ctx3, next_token);
 
-llama_sampler_accept (smpl3, next_token);
-
 printf (" %s" , next_token_str.c_str ());
 result2 += next_token_str;
 
0 commit comments