-
Notifications
You must be signed in to change notification settings - Fork 252
100 lines (82 loc) · 2.43 KB
/
amd-ci.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
name: GitHub Actions CI (AMD)

on:
  # Pushes to main trigger the workflow only when files under src/ or test/
  # change.
  push:
    branches:
      - main
    paths:
      - "src/**"
      - "test/**"
  # Pull requests targeting main always trigger the workflow; the path filter
  # below is currently disabled.
  pull_request:
    branches:
      - main
    # paths:
    #   - "src/**"
    #   - "test/**"

concurrency:
  # Runs are grouped by workflow name plus the pull request number, falling
  # back to the git ref when the event carries no pull request number. A newer
  # run cancels any in-progress run in the same group.
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
  cancel-in-progress: true
jobs:
  # Style gate: installs flake8, isort and black, then runs `make checkstyle`.
  checkstyle:
    runs-on: ubuntu-latest
    steps:
      - name: Checkout code
        uses: actions/checkout@v4
      - name: Set up Python
        uses: actions/setup-python@v5
        with:
          # Quoted so YAML keeps the string "3.10" rather than the float 3.1.
          python-version: '3.10'
      - name: Install dependencies
        run: |
          python -m pip install --upgrade pip
          pip install flake8 isort black
      - name: Run checkstyle
        run: make checkstyle

  # Environment inspection on the `linux-mi300-gpu-1` runner. Starts only after
  # `checkstyle` has succeeded (see `needs`).
  tests:
    runs-on: linux-mi300-gpu-1
    needs: [checkstyle]
    steps:
      - name: Checkout code
        uses: actions/checkout@v4
      - name: Set up Python
        uses: actions/setup-python@v5
        with:
          python-version: '3.10'
      - name: Check Docker Version
        run: docker version
      - name: Check System Environment
        # NOTE: grep exits non-zero when nothing matches, so under the default
        # `bash -e` shell this step fails if no hip/rocm package is listed.
        run: |
          sudo apt list | grep hip
          sudo apt list | grep rocm
      - name: Check Python Environment
        run: |
          python3 -m pip list
      # The steps below are currently disabled (commented out).
      # - name: Setup Dependencies
      #   run: |
      #     python3 -m pip uninstall -y torch torchvision
      #     python3 -m pip install --pre \
      #       torch==2.6.0.dev20241113+rocm6.2 \
      #       'setuptools-scm>=8' \
      #       torchvision==0.20.0.dev20241113+rocm6.2 \
      #       --extra-index-url https://download.pytorch.org/whl/nightly/rocm6.2
      #     python3 -m pip install triton==3.1.0 transformers==4.46.3
      #     python3 -m pip install -e .[dev]
      # - name: Run Unit Tests
      #   run: |
      #     python3 -m pip list | grep torch
      #     make test
      #     make test-convergence
      # - name: Build Liger-Kernel CI Docker image
      #   run: sudo docker build -t liger-kernel-ci -f Dockerfile.rocm .
      # - name: Run the tests
      #   run: |
      #     sudo docker run \
      #       --network=host \
      #       --group-add=video \
      #       --ipc=host \
      #       --cap-add=SYS_PTRACE \
      #       --security-opt seccomp=unconfined \
      #       --device /dev/kfd \
      #       --device /dev/dri \
      #       liger-kernel-ci \
      #       /bin/bash -c "make test; make test-convergence"