We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent eed827b, commit c92000a. Copy full SHA for c92000a
vllm/model_executor/models/granite.py
@@ -428,7 +428,8 @@ def compute_logits(
428
sampling_metadata: SamplingMetadata) -> Optional[torch.Tensor]:
429
logits = self.logits_processor(self.lm_head, hidden_states,
430
sampling_metadata)
431
- logits /= self.config.logits_scaling
+ if logits is not None:
432
+ logits /= self.config.logits_scaling
433
return logits
434
435
def sample(
0 commit comments