diff --git a/.github/workflows/amd-ci.yml b/.github/workflows/amd-ci.yml
index e43020f31..3539fe742 100644
--- a/.github/workflows/amd-ci.yml
+++ b/.github/workflows/amd-ci.yml
@@ -56,22 +56,36 @@ jobs:
     - name: Check Docker Version
       run: docker version
 
-    - name: Setup Dependencies
+    - name: Check System Environment
       run: |
-        python3 -m pip uninstall -y torch torchvision
-        python3 -m pip install --pre \
-          torch==2.6.0.dev20241113+rocm6.2 \
-          'setuptools-scm>=8' \
-          torchvision==0.20.0.dev20241113+rocm6.2 \
-          --extra-index-url https://download.pytorch.org/whl/nightly/rocm6.2
-        python3 -m pip install triton==3.1.0 transformers==4.46.3
-        python3 -m pip install -e .[dev]
-
-    - name: Run Unit Tests
+        # Diagnostics only: grep exits 1 when nothing matches, and the default
+        # `bash -e` step shell would fail the job on that, so tolerate no-match.
+        sudo apt list | grep hip || true
+        sudo apt list | grep rocm || true
+
+    - name: Check Python Environment
       run: |
-        python3 -m pip list | grep torch
-        make test
-        make test-convergence
+        python3 -m pip list
+
+    # NOTE(review): the setup and test steps below are commented out, so this
+    # job currently runs no tests - presumably temporary; confirm before merge.
+
+    # - name: Setup Dependencies
+    #   run: |
+    #     python3 -m pip uninstall -y torch torchvision
+    #     python3 -m pip install --pre \
+    #       torch==2.6.0.dev20241113+rocm6.2 \
+    #       'setuptools-scm>=8' \
+    #       torchvision==0.20.0.dev20241113+rocm6.2 \
+    #       --extra-index-url https://download.pytorch.org/whl/nightly/rocm6.2
+    #     python3 -m pip install triton==3.1.0 transformers==4.46.3
+    #     python3 -m pip install -e .[dev]
+
+    # - name: Run Unit Tests
+    #   run: |
+    #     python3 -m pip list | grep torch
+    #     make test
+    #     make test-convergence
 
     # - name: Build Liger-Kernel CI Docker image
     #   run: sudo docker build -t liger-kernel-ci -f Dockerfile.rocm .