We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 7381f1d, commit a8640c6 (Copy full SHA for a8640c6)
tensorrt_llm/executor/result.py
@@ -228,6 +228,9 @@ def _handle_sequence(self,
228
output.logprobs = response_tensors.log_probs[src_idx]
229
# overcome some WAR in the cpp executor
230
if finish_reasons[src_idx] != tllm.FinishReason.CANCELLED:
231
+ if len(output.logprobs) > output.length:
232
+ # WAR [nvbug 5398806]
233
+ output.logprobs = output.logprobs[:output.length]
234
assert len(output.logprobs) == output.length
235
if response_tensors.generation_logits is not None:
236
output.generation_logits = response_tensors.generation_logits[
0 commit comments