[AMD] Support Wave attention backend with AMD GPU optimizations (#8660)
Signed-off-by: Stanley Winata <stanley.winata@amd.com>
Signed-off-by: Harsh Menon <harsh@nod-labs.com>
Signed-off-by: nithinsubbiah <nithinsubbiah@gmail.com>
Signed-off-by: Ivan Butygin <ivan.butygin@gmail.com>
Signed-off-by: xintin <gaurav.verma@amd.com>
Co-authored-by: Harsh Menon <harsh@nod-labs.com>
Co-authored-by: Stanley Winata <stanley.winata@amd.com>
Co-authored-by: Stanley Winata <68087699+raikonenfnu@users.noreply.github.com>
Co-authored-by: Stanley Winata <stanley@nod-labs.com>
Co-authored-by: Ivan Butygin <ivan.butygin@gmail.com>
Co-authored-by: nithinsubbiah <nithinsubbiah@gmail.com>
Co-authored-by: Nithin Meganathan <18070964+nithinsubbiah@users.noreply.github.com>
Co-authored-by: Ivan Butygin <ibutygin@amd.com>
This commit is contained in:
@@ -196,6 +196,8 @@ suite_amd = {
|
||||
TestFile("test_torch_native_attention_backend.py", 123),
|
||||
TestFile("test_triton_attention_backend.py", 150),
|
||||
# TestFile("test_vision_chunked_prefill.py", 175), # Disabled temporarily and track in #7701
|
||||
TestFile("test_wave_attention_kernels.py", 2),
|
||||
TestFile("test_wave_attention_backend.py", 150),
|
||||
],
|
||||
"per-commit-2-gpu-amd": [
|
||||
TestFile("lora/test_lora_tp.py", 116),
|
||||
|
||||
Reference in New Issue
Block a user