From d1b6fd99637898cd5cd6a7f4bb0816a2cd71eed5 Mon Sep 17 00:00:00 2001 From: Michael Melesse Date: Tue, 21 Jan 2025 15:09:39 -0800 Subject: [PATCH] target MI300 directly --- .github/workflows/amd_tests.yml | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/.github/workflows/amd_tests.yml b/.github/workflows/amd_tests.yml index 30711520a..f32baeb6a 100644 --- a/.github/workflows/amd_tests.yml +++ b/.github/workflows/amd_tests.yml @@ -27,7 +27,7 @@ jobs: id: set-matrix run: | if [ x"${{ github.repository }}" == x"ROCm/flash-attention" ]; then - echo '::set-output name=matrix-HIP::[["self-hosted", "gfx90a"]]' + echo '::set-output name=matrix-HIP::[["linux-mi300-gpu-1"]]' else echo '::set-output name=matrix-HIP::[["ubuntu-latest"]]' fi @@ -59,13 +59,13 @@ jobs: export FLASH_ATTENTION_TRITON_AMD_ENABLE="TRUE" python setup.py install - name: Flash Attention Tests Using Reference Impl - if: matrix.runner[1] == 'gfx90a' + if: matrix.runner[0] == 'linux-mi300-gpu-1' run: | export FLASH_ATTENTION_TRITON_AMD_ENABLE="TRUE" export FLASH_ATTENTION_TRITON_AMD_REF=1 pytest tests/test_flash_attn_triton_amd.py - name: Flash Attention CDNA Tests - if: matrix.runner[1] == 'gfx90a' + if: matrix.runner[0] == 'linux-mi300-gpu-1' run: | export FLASH_ATTENTION_TRITON_AMD_ENABLE="TRUE" pytest tests/test_flash_attn_triton_amd.py @@ -75,17 +75,17 @@ jobs: export FLASH_ATTENTION_TRITON_AMD_ENABLE="TRUE" pytest tests/test_flash_attn_triton_amd.py::test_flash_attn_output tests/test_flash_attn_triton_amd.py::test_flash_attn_varlen_output tests/test_flash_attn_triton_amd.py::test_flash_attn_kvcache - name: AMD Tests - if: matrix.runner[1] == 'gfx90a' + if: matrix.runner[0] == 'linux-mi300-gpu-1' run: | export FLASH_ATTENTION_TRITON_AMD_ENABLE="TRUE" pytest -v -s flash_attn/flash_attn_triton_amd/test.py - name: AMD Bench - if: matrix.runner[1] == 'gfx90a' + if: matrix.runner[0] == 'linux-mi300-gpu-1' run: | export FLASH_ATTENTION_TRITON_AMD_ENABLE="TRUE" python flash_attn/flash_attn_triton_amd/bench.py - name: AMD Bench with Autotune - if: matrix.runner[1] == 'gfx90a' + if: matrix.runner[0] == 'linux-mi300-gpu-1' run: | export FLASH_ATTENTION_TRITON_AMD_ENABLE="TRUE" export FLASH_ATTENTION_TRITON_AMD_AUTOTUNE=1