Fix GLM45v server-launch bug with CUDA torch.compile (#9554)

This commit is contained in:
Binyao Jiang
2025-08-25 13:46:28 -07:00
committed by GitHub
parent 3affa9dcc3
commit 24a8cee66d

View File

@@ -526,6 +526,7 @@ class Qwen2_5_VLForConditionalGeneration(nn.Module):
def get_input_embeddings(self):
    """Return the ``embed_tokens`` attribute of the wrapped ``self.model``."""
    # Plain attribute read-through; nothing is copied or modified here.
    embed_tokens = self.model.embed_tokens
    return embed_tokens
@torch.no_grad()
def forward(
self,
input_ids: torch.Tensor,