Mirror of https://git.datalinker.icu/vllm-project/vllm.git (synced 2025-12-19 10:35:01 +08:00)
[Model] [gpt-oss] fix gpt-oss pp support (#23815)
Signed-off-by: zjy0516 <riverclouds.zhu@qq.com>
This commit is contained in:
Parent: a3432f18fd
Commit: bfab219648
@@ -668,9 +668,8 @@ class GptOssForCausalLM(nn.Module, SupportsPP):
|
|||||||
positions: torch.Tensor,
|
positions: torch.Tensor,
|
||||||
intermediate_tensors: Optional[IntermediateTensors] = None,
|
intermediate_tensors: Optional[IntermediateTensors] = None,
|
||||||
inputs_embeds: Optional[torch.Tensor] = None) -> torch.Tensor:
|
inputs_embeds: Optional[torch.Tensor] = None) -> torch.Tensor:
|
||||||
assert intermediate_tensors is None
|
return self.model(input_ids, positions, intermediate_tensors,
|
||||||
assert inputs_embeds is None
|
inputs_embeds)
|
||||||
return self.model(input_ids, positions)
|
|
||||||
|
|
||||||
def compute_logits(self, hidden_states: torch.Tensor,
|
def compute_logits(self, hidden_states: torch.Tensor,
|
||||||
sampling_metadata: SamplingMetadata) -> torch.Tensor:
|
sampling_metadata: SamplingMetadata) -> torch.Tensor:
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user