Skip to content

Commit

Permalink
Merge branch 'upstream_pr' of https://github.com/ROCm/xformers into u…
Browse files Browse the repository at this point in the history
…pstream_pr
  • Loading branch information
qianfengz committed Aug 20, 2024
2 parents d293caf + db2b52e commit 8eb1bbd
Show file tree
Hide file tree
Showing 2 changed files with 29 additions and 63 deletions.
83 changes: 23 additions & 60 deletions .github/workflows/rocm_ci.yml
Original file line number Diff line number Diff line change
Expand Up @@ -3,28 +3,14 @@ name: ROCM_CI
on:
pull_request:
types: [labeled, synchronize, reopened]
workflow_dispatch:
inputs:
logLevel:
description: 'Log level'
required: true
default: 'warning'
schedule:
- cron: "15 1 * * *"

jobs:
build:
runs-on: self-hosted
container:
image: 'rocm/pytorch-nightly:latest'
options: ' --cap-add=SYS_PTRACE --security-opt seccomp=unconfined --device=/dev/kfd --device=/dev/dri --group-add video --ipc=host --shm-size 8G '
if: contains(github.event.label.name, 'rocm')
runs-on: rocm

steps:
- uses: actions/checkout@v4
with:
path: '_xformers'
submodules: 'recursive'
set-safe-directory: true
fetch-depth: 0
- uses: actions/checkout@v2
- name: Get CPU info on Ubuntu
if: contains(runner.os, 'linux')
run: |
Expand All @@ -49,60 +35,37 @@ jobs:
export ROCM_PATH=/opt/rocm
echo ROCM_PATH = $ROCM_PATH
export MAX_JOBS=64
echo MAX_JOBS = $MAX_JOBS
hipcc --version
rocm-smi
rocminfo | grep "gfx"
- name: Setup build env
run: |
conda create -n xformers python=3.11
export PATH=/opt/conda/envs/xformers/bin:$PATH
python -VV
python -m pip install -U torch --index-url=https://download.pytorch.org/whl/nightly/rocm6.1
python -c "import torch; print(f'PyTorch version {torch.__version__}')"
python -m pip install ninja scipy pytest pytest-html
- name: Pre-build clean
- name: Build XFormers
run: |
cd _xformers
git clean -ffdx
cd ..
git clone --recursive -b $GIT_BRANCH $GITHUB_REPOSITORY
docker run -it --cap-add=SYS_PTRACE --security-opt seccomp=unconfined --device=/dev/kfd --device=/dev/dri --group-add video --ipc=host --shm-size 8G -v $PWD/xformers:/xformers rocm/pytorch-nightly:latest
- name: Build xformers
run: |
export PATH=/opt/conda/envs/xformers/bin:$PATH
export MAX_JOBS=144
python -m pip install -e ./_xformers --verbose
python -m xformers.info
pip3 install --upgrade pip
pip3 uninstall -y xformers
MAX_JOBS=$MAX_JOBS pip3 install -e /xformers --verbose
pip3 install scipy==1.10
python3 -c "import torch; print(torch.__version__)"
python3 -m xformers.info
- name: Run python tests
run: |
export PATH=/opt/conda/envs/xformers/bin:$PATH
python -m pytest --html=test_mem_eff_attention.html --self-contained-html -rpfs ./_xformers/tests/test_mem_eff_attention.py -k "not flshatt"
pytest -rpfs /xformers/tests/test_mem_eff_attention.py | tee test_mem_eff_attention.log
- name: Archive logs
if: '!cancelled()'
uses: actions/upload-artifact@v4
uses: actions/upload-artifact@v3
with:
name: test results
path: test_mem_eff_attention.html
path: test_mem_eff_attention_ck.log

- name: Post-build clean
if: '!cancelled()'
- name: Process test results
run: |
cd _xformers
git clean -ffdx
cd ..
clean:
runs-on: self-hosted
if: ${{ always() }}
needs: [build]
steps:
- name: Remove dangling Docker images
run: |
docker images -q -f dangling=true | xargs --no-run-if-empty docker rmi
echo "Processing test results TBD"
9 changes: 6 additions & 3 deletions tests/test_mem_eff_attention.py
Original file line number Diff line number Diff line change
Expand Up @@ -38,13 +38,16 @@
if torch.cuda.is_available():
compute_capability = torch.cuda.get_device_capability("cuda")
sm70_or_better_only = pytest.mark.skipif(
torch.version.cuda is not None and compute_capability < (7, 0), reason="requires sm70+"
torch.version.cuda is not None and compute_capability < (7, 0),
reason="requires sm70+",
)
sm75_or_better_only = pytest.mark.skipif(
torch.version.cuda is not None and compute_capability < (7, 5), reason="requires sm75+"
torch.version.cuda is not None and compute_capability < (7, 5),
reason="requires sm75+",
)
sm80_or_better_only = pytest.mark.skipif(
torch.version.cuda is not None and compute_capability < (8, 0), reason="requires sm80+"
torch.version.cuda is not None and compute_capability < (8, 0),
reason="requires sm80+",
)
skip_if_rocm = pytest.mark.skipif(
torch.version.hip is not None, reason="not supported on ROCm"
Expand Down

0 comments on commit 8eb1bbd

Please sign in to comment.