forked from flashinfer-ai/flashinfer
-
Notifications
You must be signed in to change notification settings - Fork 0
109 lines (96 loc) · 3.03 KB
/
release_wheel.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
# Adapted from https://github.com/punica-ai/punica/blob/591b59899f0a20760821785d06b331c8a2e5cb86/.github/workflows/release_wheel.yml
name: Release
on:
workflow_dispatch:
inputs:
tag_name:
required: true
type: string
workflow_call:
inputs:
tag_name:
required: true
type: string
secrets:
WHL_TOKEN:
required: true
# PYPI_TEST_TOKEN:
# required: true
env:
TORCH_CUDA_ARCH_LIST: "7.5 8.0 8.9 9.0+PTX"
jobs:
build:
strategy:
fail-fast: false
matrix:
cuda: ["11.8", "12.1", "12.4"]
torch: ["2.2", "2.3", "2.4"]
exclude: # for cuda 12.4, we only support torch 2.4+
- cuda: "12.4"
torch: "2.2"
- cuda: "12.4"
torch: "2.3"
runs-on: [self-hosted]
steps:
- uses: actions/checkout@v4
with:
submodules: true
- name: Build wheel
run: |
chown -R $CI_UID:$CI_GID "$GITHUB_WORKSPACE"
docker run --rm -t \
-v "$CI_RUNNER_CACHE_DIR":/ci-cache \
-v "$GITHUB_WORKSPACE":/app \
-e FLASHINFER_CI_CUDA_VERSION=${{ matrix.cuda }} \
-e FLASHINFER_CI_TORCH_VERSION=${{ matrix.torch }} \
-e TORCH_CUDA_ARCH_LIST="$TORCH_CUDA_ARCH_LIST" \
-e MAX_JOBS=128 \
--user $CI_UID:$CI_GID \
pytorch/manylinux-builder:cuda${{ matrix.cuda }} \
bash /app/scripts/run-ci-build-wheel.sh
timeout-minutes: 120
- run: du -h dist/*
- uses: actions/upload-artifact@v4
with:
name: wheel-cuda${{ matrix.cuda }}-torch${{ matrix.torch }}
path: dist/*
release:
needs: build
runs-on: [self-hosted]
steps:
- uses: actions/download-artifact@v4
with:
path: dist/
merge-multiple: true
pattern: wheel-*
- run: ls -lah dist/
- uses: softprops/action-gh-release@v1
with:
tag_name: ${{ inputs.tag_name }}
files: |
dist/flashinfer*.whl
- uses: softprops/action-gh-release@v1
with:
tag_name: ${{ inputs.tag_name }}
files: |
dist/flashinfer-*.tar.gz
- name: Clone wheel index
run: git clone https://oauth2:${WHL_TOKEN}@github.com/flashinfer-ai/whl.git flashinfer-whl
env:
WHL_TOKEN: ${{ secrets.WHL_TOKEN }}
- name: Update wheel index
run: python3 scripts/update_whl_index.py
- name: Push wheel index
run: |
cd flashinfer-whl
git config --local user.name "github-actions[bot]"
git config --local user.email "41898282+github-actions[bot]@users.noreply.github.com"
git add -A
git commit -m "update whl"
git push
# - name: Upload sdist to pypi
# run: |
# pip install twine
# python -m twine upload --repository testpypi --username=__token__ dist/*.tar.gz
# env:
# TWINE_PASSWORD: ${{ secrets.PYPI_TEST_TOKEN }}