You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
llama_token token = model.vocab.token_bos(); // not actually used by llama_build_graph, but required to choose between token and embedding inputs graph
292
292
293
+
// restore later
294
+
// TODO: something cleaner
295
+
const auto n_outputs_save = n_outputs;
296
+
293
297
// max number of outputs
294
298
n_outputs = n_tokens;
295
299
@@ -341,6 +345,8 @@ llama_context::llama_context(
341
345
}
342
346
}
343
347
348
+
n_outputs = n_outputs_save;
349
+
344
350
for (size_t i = 0; i < backend_ptrs.size(); ++i) {
0 commit comments