use topk_softmax with sgl-kernel (#4439)

This commit is contained in:
Yineng Zhang
2025-03-14 15:59:06 -07:00
committed by GitHub
parent e73167ade3
commit ad1ae7f7cd
18 changed files with 48 additions and 35 deletions

View File

@@ -26,4 +26,4 @@ pip install transformers==4.45.2 sentence_transformers accelerate==1.4.0 peft pa
pip install cuda-python nvidia-cuda-nvrtc-cu12
# reinstall sgl-kernel
-pip install sgl-kernel==0.0.5 --force-reinstall --no-deps
+pip install sgl-kernel==0.0.5.post1 --force-reinstall --no-deps