File tree Expand file tree Collapse file tree 1 file changed +3
-4
lines changed Expand file tree Collapse file tree 1 file changed +3
-4
lines changed Original file line number Diff line number Diff line change @@ -37,6 +37,9 @@ int main(int argc, char ** argv) {
37
37
return 1 ;
38
38
}
39
39
40
+ // set n_probs so that token probabilities are still computed when temp == 0
41
+ params.sparams .n_probs = 16 ;
42
+
40
43
// max number of parallel drafting sequences (i.e. tree branches)
41
44
const int n_seq_dft = params.n_parallel ;
42
45
@@ -182,10 +185,6 @@ int main(int argc, char ** argv) {
182
185
// draft sequence data
183
186
std::vector<seq_draft> drafts (n_seq_dft);
184
187
185
- if (params.sparams .temp == 0 ) {
186
- params.sparams .temp = -1 .0f ; // force greedy sampling with probs for the draft model
187
- }
188
-
189
188
for (int s = 0 ; s < n_seq_dft; ++s) {
190
189
// allocate llama_sampling for each draft sequence
191
190
drafts[s].smpl = llama_sampling_init (model_dft, params.sparams );
You can’t perform that action at this time.
0 commit comments