diff --git a/gpttype_adapter.cpp b/gpttype_adapter.cpp index 5b76b74920422..4e0140b7c905b 100644 --- a/gpttype_adapter.cpp +++ b/gpttype_adapter.cpp @@ -3611,7 +3611,7 @@ generation_outputs gpttype_generate(const generation_inputs inputs) { logits_to_sample = draft_results.drafted_amount; } - while(logits_sampled0 && !abort_draft) + while(logits_sampled0 && !abort_draft && !early_abort) { if(logits_sampled>0) {