mirror of
https://github.com/BillyOutlast/flash-attention-prebuild-wheels-rocm.git
synced 2026-07-01 01:27:54 -04:00
ab165f3f22
- Move auditwheel repair after initial release upload with continue-on-error to allow pipeline continuation - Add manylinux platform normalization support in normalize_platform_name() - Expand self-hosted build matrix to include Python 3.14 and Flash Attention 2.8.3 - Improve wheel upload flow by separating regular and manylinux wheel handling
204 lines
4.6 KiB
Python
204 lines
4.6 KiB
Python
import json
|
|
|
|
# Combinations to drop from the generated build matrices. Each entry is a
# partial match on matrix axes; main() emits this list under the "exclude" key.
EXCLUDE = [
    # torch < 2.2 does not support Python 3.12
    {"python-version": "3.12", "torch-version": "2.0.1"},
    {"python-version": "3.12", "torch-version": "2.1.2"},
    # torch 2.0.1 does not support CUDA 12.x
    {"torch-version": "2.0.1", "cuda-version": "12.1"},
    {"torch-version": "2.0.1", "cuda-version": "12.4"},
    {"torch-version": "2.0.1", "cuda-version": "12.6"},
    {"torch-version": "2.0.1", "cuda-version": "12.8"},
    # torch 2.6.0 does not support CUDA 12.1
    {"torch-version": "2.6.0", "cuda-version": "12.1"},
    # torch 2.7.0 does not support CUDA 12.4
    # NOTE(review): the matrices in this file list torch 2.7.1, not 2.7.0 --
    # confirm whether 2.7.1 needs the same exclusion.
    {"torch-version": "2.7.0", "cuda-version": "12.4"},
    # torch < 2.8 does not support CUDA 12.9
    {"torch-version": "2.5.1", "cuda-version": "12.9"},
    # Was "2.6.3" (a flash-attn version, not a torch one); the torch release
    # used throughout this file is 2.6.0.
    {"torch-version": "2.6.0", "cuda-version": "12.9"},
    {"torch-version": "2.7.1", "cuda-version": "12.9"},
    # torch >= 2.9 does not support Python 3.9
    {"torch-version": "2.9.1", "python-version": "3.9"},
    # torch < 2.9 does not support CUDA 13.0
    {"torch-version": "2.5.1", "cuda-version": "13.0"},
    {"torch-version": "2.6.0", "cuda-version": "13.0"},
    {"torch-version": "2.7.1", "cuda-version": "13.0"},
    # 2.8.1 is not listed in any matrix in this file; the entry is kept
    # unchanged so existing behaviour for it is preserved.
    {"torch-version": "2.8.1", "cuda-version": "13.0"},
    {"torch-version": "2.8.0", "cuda-version": "13.0"},
    # Python 3.14 is supported from torch 2.9
    {"torch-version": "2.5.1", "python-version": "3.14"},
    # Was "2.6.3"; corrected to the torch release the matrices actually use.
    {"torch-version": "2.6.0", "python-version": "3.14"},
    {"torch-version": "2.7.1", "python-version": "3.14"},
    {"torch-version": "2.8.0", "python-version": "3.14"},
]
|
|
|
|
# Axis values for the "linux" build target (referenced from main()).
# Values that are switched off are recorded in the trailing comments so they
# can be re-enabled by moving them back into the list.
LINUX_MATRIX = {
    "flash-attn-version": ["2.6.3", "2.7.4", "2.8.3"],
    "python-version": ["3.10", "3.11", "3.12", "3.13"],
    "torch-version": ["2.5.1", "2.6.0", "2.7.1", "2.8.0", "2.9.1"],
    "cuda-version": ["12.4", "12.8", "13.0"],  # disabled: "12.6", "12.9"
}
|
|
|
|
# Axis values for the "linux_arm64" build target (referenced from main()).
# Switched-off values are listed in the trailing comments.
LINUX_ARM64_MATRIX = {
    "flash-attn-version": ["2.7.4", "2.8.3"],  # disabled: "2.6.3"
    "python-version": ["3.10", "3.11", "3.12"],  # disabled: "3.13"
    "torch-version": ["2.5.1", "2.6.0", "2.7.1", "2.9.1"],  # disabled: "2.8.0"
    "cuda-version": ["12.4", "12.8", "13.0"],  # disabled: "12.6", "12.9"
}
|
|
|
|
# Axis values for the "linux_self_hosted" build target; this is the matrix
# main() currently emits in full.
LINUX_SELF_HOSTED_MATRIX = {
    "flash-attn-version": ["2.7.4", "2.8.3"],
    "python-version": ["3.10", "3.11", "3.12", "3.13", "3.14"],
    "torch-version": ["2.9.1"],
    "cuda-version": ["12.8", "13.0"],
}
|
|
|
|
# Axis values for the "linux_arm64_self_hosted" build target.
# Switched-off values are listed in the trailing comments.
LINUX_ARM64_SELF_HOSTED_MATRIX = {
    "flash-attn-version": ["2.7.4"],  # disabled: "2.6.3", "2.8.3"
    "python-version": ["3.10", "3.11", "3.12"],  # disabled: "3.13"
    "torch-version": ["2.5.1", "2.6.0", "2.7.1", "2.9.1"],  # disabled: "2.8.0"
    "cuda-version": ["12.4", "12.8", "13.0"],  # disabled: "12.6", "12.9"
}
|
|
|
|
# Axis values for the "windows" build target (referenced from main()).
# Switched-off values are listed in the trailing comments.
WINDOWS_MATRIX = {
    "flash-attn-version": ["2.6.3"],  # disabled: "2.7.4", "2.8.3"
    "python-version": ["3.10", "3.11", "3.12"],  # disabled: "3.13"
    "torch-version": ["2.5.1", "2.6.0", "2.7.1", "2.8.0", "2.9.1"],
    "cuda-version": ["12.4", "12.8", "13.0"],  # disabled: "12.6", "12.9"
}
|
|
|
|
# Axis values for the "windows_code_build" build target (referenced from main()).
# Note this matrix spells the flash-attn release as "2.7.4.post1", unlike the
# other matrices in this file which use "2.7.4".
WINDOWS_CODEBUILD_MATRIX = {
    "flash-attn-version": [
        "2.6.3",
        "2.7.4.post1",
        "2.8.3",
    ],
    "python-version": [
        "3.10",
        "3.11",
        "3.12",
        "3.13",
    ],
    "torch-version": [
        "2.9.1",
    ],
    "cuda-version": [
        "13.0",
    ],
}
|
|
|
|
|
|
def main():
    """Print the build-matrix configuration to stdout as one JSON document.

    Each target key maps either to its matrix dict or to ``False``. The
    commented line next to each key is the alternative setting for that
    target. The exclusion list is emitted under the "exclude" key.
    """
    # json.dumps keeps dict insertion order, so the key order below is the
    # key order of the printed JSON.
    config = {
        "linux": False,
        # "linux": LINUX_MATRIX,
        #
        "linux_arm64": False,
        # "linux_arm64": LINUX_ARM64_MATRIX,
        #
        # "linux_self_hosted": False,
        "linux_self_hosted": LINUX_SELF_HOSTED_MATRIX,
        #
        # Both settings for this target are commented out, so the key is
        # absent from the output.
        # "linux_arm64_self_hosted": False,
        # "linux_arm64_self_hosted": LINUX_ARM64_SELF_HOSTED_MATRIX,
        #
        "windows": False,
        # "windows": WINDOWS_MATRIX,
        #
        "windows_code_build": False,
        # "windows_code_build": WINDOWS_CODEBUILD_MATRIX,
        #
        "exclude": EXCLUDE,
    }
    serialized = json.dumps(config)
    print(serialized)


if __name__ == "__main__":
    main()
|