mirror of
https://github.com/BillyOutlast/flash-attention-prebuild-wheels-rocm.git
synced 2026-07-01 01:27:54 -04:00
92464a9b3b
- Change wheel output to use full path instead of basename for better flexibility - Add patchelf to build dependencies for wheel repair operations - Enable auditwheel repair step with proper exclusions for CUDA/torch libraries - Separate wheel path variable to track both standard and manylinux versions - Rename manylinux workflow file to reflect its dedicated purpose - Update workflow references to use renamed manylinux workflow - Use fromjson() for runner parameter parsing in ARM build workflow - Update test workflows to use container environment consistently - Support both manylinux and standard wheel uploads to releases
31 lines
1022 B
YAML
31 lines
1022 B
YAML
# Manually dispatched test run of the self-hosted Linux wheel build.
name: Test self-hosted Linux build

on:
  workflow_dispatch:

jobs:
  # ---------------------------------------------------------
  # Build wheels with self-hosted runner
  # ---------------------------------------------------------
  build_wheels_self_hosted:
    name: Build wheels and Upload (Linux x86_64, self-hosted runner)
    # Delegates the whole job to the reusable workflow in this repository.
    uses: ./.github/workflows/_build_linux_self_host.yml
    strategy:
      # Keep the remaining matrix combinations running if one fails.
      fail-fast: false
      matrix:
        flash-attn-version:
          - "2.8.3"
        python-version:
          - "3.13"
        torch-version:
          - "2.9.1"
        # Available CUDA releases:
        # https://developer.nvidia.com/cuda-toolkit-archive
        cuda-version:
          - "13.0.1"
        # Each entry is a JSON-encoded list of runner labels kept as one
        # string; presumably decoded by the called workflow - verify there.
        # Alternative entry: '["openci-runner-beta"]'
        runner:
          - '["self-hosted", "x64"]'
    with:
      flash-attn-version: ${{ matrix.flash-attn-version }}
      python-version: ${{ matrix.python-version }}
      torch-version: ${{ matrix.torch-version }}
      cuda-version: ${{ matrix.cuda-version }}
      # NOTE(review): upload is switched off for this test workflow; the
      # exact effect is defined by the called workflow - confirm there.
      is-upload: false
      runner: ${{ matrix.runner}}
      use-container: true