[Speculative decoding] [Bugfix] Fix overallocation in ngram + spec logprobs (#4672)
This commit is contained in:
parent
f942efb5a3
commit
8b9241be3a
@@ -138,7 +138,7 @@ class NGramWorker(LoraNotSupportedWorkerBase):
 SamplerOutput(
 outputs=None,
 sampled_token_probs=token_probs[i],
-logprobs=token_logprobs,
+logprobs=token_logprobs[i],
 sampled_token_ids=token_ids[i],
 ))
 return outputs, False
Loading…
Reference in New Issue
Block a user