From 603aa0a66d009288fa6a19c0bd2f0a1eb84d8e06 Mon Sep 17 00:00:00 2001 From: Junya Morioka Date: Tue, 23 Dec 2025 16:38:52 +0900 Subject: [PATCH] docs: Update docs --- .github/workflows/build.yml | 1 + build_linux.sh | 4 +- docs/packages.md | 141 ++++++++++++++++++++++++++++-------- docs/release_history.md | 124 +++++++++++++++++-------------- 4 files changed, 183 insertions(+), 87 deletions(-) diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index a8286bf..eb3bdf8 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -235,6 +235,7 @@ jobs: run: | git config --global user.name "github-actions[bot]" git config --global user.email "41898282+github-actions[bot]@users.noreply.github.com" + git pull if git diff --quiet; then echo "No docs updates to commit." exit 0 diff --git a/build_linux.sh b/build_linux.sh index 99dcf6a..49b9cb3 100755 --- a/build_linux.sh +++ b/build_linux.sh @@ -55,11 +55,11 @@ echo " RAM: ${RAM_GB}GB" if [[ -z "${MAX_JOBS:-}" && -z "${NVCC_THREADS:-}" ]]; then # Calculate max product based on following constraints: # - MAX_JOBS x NVCC_THREADS(<= 4) <= NUM_THREADS - # - 2.5GB x MAX_JOBS x NVCC_THREADS(<= 4) <= RAM_GB + # - 2.8GB x MAX_JOBS x NVCC_THREADS(<= 4) <= RAM_GB # Set MAX_PRODUCT from RAM MAX_PRODUCT_CPU=$NUM_THREADS - MAX_PRODUCT_RAM=$(awk -v ram="$RAM_GB" 'BEGIN {print int(ram / 2.5)}') + MAX_PRODUCT_RAM=$(awk -v ram="$RAM_GB" 'BEGIN {print int(ram / 2.8)}') MAX_PRODUCT=$((MAX_PRODUCT_CPU < MAX_PRODUCT_RAM ? MAX_PRODUCT_CPU : MAX_PRODUCT_RAM)) # Set MAX_JOBS and NVCC_THREADS so that MAX_JOBS x NVCC_THREADS ≈ MAX_PRODUCT with NVCC_THREADS <= 4 diff --git a/docs/packages.md b/docs/packages.md index 9423dfc..fb551f0 100644 --- a/docs/packages.md +++ b/docs/packages.md @@ -29,6 +29,10 @@ - [Flash-Attention 2.8.3](#flash-attention-283) - [Flash-Attention 2.7.4](#flash-attention-274) - [Flash-Attention 2.6.3](#flash-attention-263) +- [Manylinux2014 x86_64](#manylinux2014-x86_64) + - [Flash-Attention 2.8.3](#flash-attention-283) + - [Flash-Attention 2.7.4](#flash-attention-274) + - [Flash-Attention 2.6.3](#flash-attention-263) - [Windows x86_64](#windows-x86_64) - [Flash-Attention 2.8.3](#flash-attention-283) - [Flash-Attention 2.8.2](#flash-attention-282) @@ -56,10 +60,10 @@ | 3.9 | 2.8 | 12.6 | [Download1(v0.4.16)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.16/flash_attn-2.8.3+cu126torch2.8-cp39-cp39-linux_x86_64.whl) | | 3.10 | 2.5 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.5 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.5-cp310-cp310-linux_x86_64.whl) | -| 3.10 | 2.5 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl) | +| 3.10 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download3(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.6-cp310-cp310-linux_x86_64.whl) | -| 3.10 | 2.6 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl) | +| 3.10 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download3(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.6 | 12.9 | [Download1(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu129torch2.6-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.7-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.7-cp310-cp310-linux_x86_64.whl) | @@ -74,7 +78,7 @@ | 3.10 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu130torch2.9-cp310-cp310-linux_x86_64.whl), [Download2(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.8.3+cu130torch2.9-cp310-cp310-linux_x86_64.whl), [Download3(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu130torch2.9-cp310-cp310-linux_x86_64.whl), [Download4(v0.4.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.18/flash_attn-2.8.3+cu130torch2.9-cp310-cp310-linux_x86_64.whl) | | 3.11 | 2.5 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.5-cp311-cp311-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.5-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.5 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.5-cp311-cp311-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.5-cp311-cp311-linux_x86_64.whl) | -| 3.11 | 2.5 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.5-cp311-cp311-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.5-cp311-cp311-linux_x86_64.whl) | +| 3.11 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp311-cp311-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.5-cp311-cp311-linux_x86_64.whl), [Download3(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.5-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.6-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.6 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl) | @@ -92,14 +96,14 @@ | 3.11 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu130torch2.9-cp311-cp311-linux_x86_64.whl), [Download2(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.8.3+cu130torch2.9-cp311-cp311-linux_x86_64.whl), [Download3(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu130torch2.9-cp311-cp311-linux_x86_64.whl), [Download4(v0.4.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.18/flash_attn-2.8.3+cu130torch2.9-cp311-cp311-linux_x86_64.whl) | | 3.12 | 2.5 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.5 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.5-cp312-cp312-linux_x86_64.whl) | -| 3.12 | 2.5 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl) | +| 3.12 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.6-cp312-cp312-linux_x86_64.whl) | -| 3.12 | 2.6 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl) | +| 3.12 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.6 | 12.9 | [Download1(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu129torch2.6-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.7-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.7-cp312-cp312-linux_x86_64.whl) | -| 3.12 | 2.7 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.7-cp312-cp312-linux_x86_64.whl) | +| 3.12 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.7-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.8 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.8-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.8 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.8-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.8 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.8-cp312-cp312-linux_x86_64.whl) | @@ -108,6 +112,7 @@ | 3.12 | 2.9 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.8.3+cu126torch2.9-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.15)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.15/flash_attn-2.8.3+cu126torch2.9-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.8.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download3(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download4(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.8.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download5(v0.4.15)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.15/flash_attn-2.8.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.9 | 13.0 | [Download1(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.8.3+cu130torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu130torch2.9-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.18/flash_attn-2.8.3+cu130torch2.9-cp312-cp312-linux_x86_64.whl) | +| 3.13 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp313-cp313-linux_x86_64.whl) | | 3.13 | 2.6 | 12.4 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu124torch2.6-cp313-cp313-linux_x86_64.whl) | | 3.13 | 2.6 | 12.6 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu126torch2.6-cp313-cp313-linux_x86_64.whl) | | 3.13 | 2.6 | 12.8 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu128torch2.6-cp313-cp313-linux_x86_64.whl) | @@ -117,8 +122,8 @@ | 3.13 | 2.7 | 12.8 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu128torch2.7-cp313-cp313-linux_x86_64.whl) | | 3.13 | 2.8 | 12.4 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu124torch2.8-cp313-cp313-linux_x86_64.whl) | | 3.13 | 2.8 | 12.6 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu126torch2.8-cp313-cp313-linux_x86_64.whl) | -| 3.13 | 2.8 | 12.8 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu128torch2.8-cp313-cp313-linux_x86_64.whl) | -| 3.13 | 2.8 | 12.9 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu129torch2.8-cp313-cp313-linux_x86_64.whl) | +| 3.13 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.8-cp313-cp313-linux_x86_64.whl), [Download2(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu128torch2.8-cp313-cp313-linux_x86_64.whl) | +| 3.13 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu129torch2.8-cp313-cp313-linux_x86_64.whl), [Download2(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu129torch2.8-cp313-cp313-linux_x86_64.whl) | | 3.13 | 2.9 | 12.6 | [Download1(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.8.3+cu126torch2.9-cp313-cp313-linux_x86_64.whl), [Download2(v0.4.15)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.15/flash_attn-2.8.3+cu126torch2.9-cp313-cp313-linux_x86_64.whl) | | 3.13 | 2.9 | 12.8 | [Download1(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.8.3+cu128torch2.9-cp313-cp313-linux_x86_64.whl), [Download2(v0.4.15)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.15/flash_attn-2.8.3+cu128torch2.9-cp313-cp313-linux_x86_64.whl) | | 3.13 | 2.9 | 13.0 | [Download1(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.8.3+cu130torch2.9-cp313-cp313-linux_x86_64.whl), [Download2(v0.5.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.2/flash_attn-2.8.3+cu130torch2.9-cp313-cp313-linux_x86_64.whl), [Download3(v0.4.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.18/flash_attn-2.8.3+cu130torch2.9-cp313-cp313-linux_x86_64.whl) | @@ -314,32 +319,32 @@ | ------ | ------- | ---- | ------- | | 3.10 | 2.5 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.5-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.5 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.5-cp310-cp310-linux_x86_64.whl) | -| 3.10 | 2.5 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.5-cp310-cp310-linux_x86_64.whl) | +| 3.10 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.5-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.6-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.6-cp310-cp310-linux_x86_64.whl) | -| 3.10 | 2.6 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.6-cp310-cp310-linux_x86_64.whl) | -| 3.10 | 2.6 | 12.9 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.6-cp310-cp310-linux_x86_64.whl) | +| 3.10 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.6-cp310-cp310-linux_x86_64.whl) | +| 3.10 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.6-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.7-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.7-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.7-cp310-cp310-linux_x86_64.whl) | -| 3.10 | 2.7 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.10)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.10/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download3(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-linux_x86_64.whl) | +| 3.10 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.10)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.10/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download4(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.8 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.8-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.8-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.8-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.8 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.8-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.8 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.8-cp310-cp310-linux_x86_64.whl), [Download2(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.7.4+cu128torch2.8-cp310-cp310-linux_x86_64.whl) | -| 3.10 | 2.8 | 12.9 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.8-cp310-cp310-linux_x86_64.whl) | +| 3.10 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.8-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.8-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.9 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.9-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.9 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.9-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu128torch2.9-cp310-cp310-linux_x86_64.whl), [Download2(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.7.4+cu128torch2.9-cp310-cp310-linux_x86_64.whl), [Download3(v0.4.21)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.21/flash_attn-2.7.4+cu128torch2.9-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu130torch2.9-cp310-cp310-linux_x86_64.whl), [Download2(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.7.4+cu130torch2.9-cp310-cp310-linux_x86_64.whl), [Download3(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu130torch2.9-cp310-cp310-linux_x86_64.whl), [Download4(v0.4.21)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.21/flash_attn-2.7.4+cu130torch2.9-cp310-cp310-linux_x86_64.whl) | | 3.11 | 2.5 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.5-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.5-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.5-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.5 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.5-cp311-cp311-linux_x86_64.whl) | -| 3.11 | 2.5 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.5-cp311-cp311-linux_x86_64.whl) | +| 3.11 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.5-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.5-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.6-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.6-cp311-cp311-linux_x86_64.whl) | -| 3.11 | 2.6 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.6-cp311-cp311-linux_x86_64.whl) | +| 3.11 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.6-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.6 | 12.9 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.6-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.7-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.7-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.7-cp311-cp311-linux_x86_64.whl) | -| 3.11 | 2.7 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.10)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.10/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download3(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-linux_x86_64.whl) | +| 3.11 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.10)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.10/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download4(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.8 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.8-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.8-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.8-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.8 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.8-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.8 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download2(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.7.4+cu128torch2.8-cp311-cp311-linux_x86_64.whl) | @@ -357,15 +362,18 @@ | 3.12 | 2.6 | 12.9 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.6-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.7-cp312-cp312-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.7-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.7-cp312-cp312-linux_x86_64.whl) | -| 3.12 | 2.7 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.10)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.10/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download3(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-linux_x86_64.whl) | +| 3.12 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download3(v0.3.10)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.10/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download4(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.8 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.8-cp312-cp312-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.8-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.8 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.8-cp312-cp312-linux_x86_64.whl) | -| 3.12 | 2.8 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.7.4+cu128torch2.8-cp312-cp312-linux_x86_64.whl) | -| 3.12 | 2.8 | 12.9 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.8-cp312-cp312-linux_x86_64.whl) | +| 3.12 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.8-cp312-cp312-linux_x86_64.whl), [Download3(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.7.4+cu128torch2.8-cp312-cp312-linux_x86_64.whl) | +| 3.12 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.8-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.9 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.9-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.9 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.9-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.7.4+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.21)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.21/flash_attn-2.7.4+cu128torch2.9-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu130torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.7.4+cu130torch2.9-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.21)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.21/flash_attn-2.7.4+cu130torch2.9-cp312-cp312-linux_x86_64.whl) | +| 3.13 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.6-cp313-cp313-linux_x86_64.whl) | +| 3.13 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.8-cp313-cp313-linux_x86_64.whl) | +| 3.13 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.8-cp313-cp313-linux_x86_64.whl) | | 3.13 | 2.9 | 12.8 | [Download1(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.7.4+cu128torch2.9-cp313-cp313-linux_x86_64.whl), [Download2(v0.4.21)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.21/flash_attn-2.7.4+cu128torch2.9-cp313-cp313-linux_x86_64.whl) | | 3.13 | 2.9 | 13.0 | [Download1(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.7.4+cu130torch2.9-cp313-cp313-linux_x86_64.whl), [Download2(v0.4.21)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.21/flash_attn-2.7.4+cu130torch2.9-cp313-cp313-linux_x86_64.whl) | | 3.14 | 2.9 | 12.8 | [Download1(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.7.4+cu128torch2.9-cp314-cp314-linux_x86_64.whl) | @@ -572,20 +580,20 @@ | 3.10 | 2.5 | 12.1 | [Download1(v0.0.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.2/flash_attn-2.6.3+cu121torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.0.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.1/flash_attn-2.6.3+cu121torch2.5-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.5 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download3(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download5(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download6(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download7(v0.0.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.2/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download8(v0.0.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.1/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.5 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.5-cp310-cp310-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.5-cp310-cp310-linux_x86_64.whl), [Download4(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu126torch2.5-cp310-cp310-linux_x86_64.whl), [Download5(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu126torch2.5-cp310-cp310-linux_x86_64.whl) | -| 3.10 | 2.5 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl) | +| 3.10 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.6 | 11.8 | [Download1(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu118torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu118torch2.6-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download3(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download5(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download6(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.6-cp310-cp310-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.6-cp310-cp310-linux_x86_64.whl), [Download4(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu126torch2.6-cp310-cp310-linux_x86_64.whl), [Download5(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu126torch2.6-cp310-cp310-linux_x86_64.whl) | -| 3.10 | 2.6 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl) | -| 3.10 | 2.6 | 12.9 | [Download1(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.6-cp310-cp310-linux_x86_64.whl) | +| 3.10 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl) | +| 3.10 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.6-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.7 | 11.8 | [Download1(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu118torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu118torch2.7-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.7-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.7-cp310-cp310-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.7-cp310-cp310-linux_x86_64.whl) | -| 3.10 | 2.7 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.9/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download4(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download5(v0.0.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.9/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download6(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl) | +| 3.10 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download4(v0.3.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.9/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download5(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download6(v0.0.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.9/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download7(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.8 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.8-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.8-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.8 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.8-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.8 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.8-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.8-cp310-cp310-linux_x86_64.whl), [Download3(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.6.3+cu128torch2.8-cp310-cp310-linux_x86_64.whl), [Download4(v0.2.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.0/flash_attn-2.6.3+cu128torch2.8-cp310-cp310-linux_x86_64.whl) | -| 3.10 | 2.8 | 12.9 | [Download1(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.8-cp310-cp310-linux_x86_64.whl) | +| 3.10 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.8-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.8-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.9 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.9-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.9 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.9-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.6.3+cu126torch2.9-cp310-cp310-linux_x86_64.whl) | | 3.10 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu128torch2.9-cp310-cp310-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.9-cp310-cp310-linux_x86_64.whl), [Download3(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.6.3+cu128torch2.9-cp310-cp310-linux_x86_64.whl) | @@ -616,15 +624,15 @@ | 3.11 | 2.6 | 11.8 | [Download1(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu118torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu118torch2.6-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download3(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download5(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download6(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.6-cp311-cp311-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.6-cp311-cp311-linux_x86_64.whl), [Download4(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu126torch2.6-cp311-cp311-linux_x86_64.whl), [Download5(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu126torch2.6-cp311-cp311-linux_x86_64.whl) | -| 3.11 | 2.6 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl) | -| 3.11 | 2.6 | 12.9 | [Download1(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.6-cp311-cp311-linux_x86_64.whl) | +| 3.11 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl) | +| 3.11 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.6-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.7 | 11.8 | [Download1(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu118torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu118torch2.7-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.7-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.7-cp311-cp311-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.7-cp311-cp311-linux_x86_64.whl) | -| 3.11 | 2.7 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.9/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download4(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download5(v0.0.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.9/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download6(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl) | +| 3.11 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download4(v0.3.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.9/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download5(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download6(v0.0.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.9/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download7(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.8 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.8-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.8-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.8 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.8-cp311-cp311-linux_x86_64.whl) | -| 3.11 | 2.8 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download3(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download4(v0.2.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.0/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl) | +| 3.11 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download4(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download5(v0.2.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.0/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.8 | 12.9 | [Download1(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.8-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.9 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.9-cp311-cp311-linux_x86_64.whl) | | 3.11 | 2.9 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.9-cp311-cp311-linux_x86_64.whl), [Download2(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.6.3+cu126torch2.9-cp311-cp311-linux_x86_64.whl) | @@ -647,12 +655,12 @@ | 3.12 | 2.5 | 12.1 | [Download1(v0.0.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.2/flash_attn-2.6.3+cu121torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.0.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.1/flash_attn-2.6.3+cu121torch2.5-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.0/flash_attn-2.6.3+cu121torch2.5-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.5 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download5(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download6(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download7(v0.0.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.2/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download8(v0.0.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.1/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download9(v0.0.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.0/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.5 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.5-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.5-cp312-cp312-linux_x86_64.whl), [Download4(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu126torch2.5-cp312-cp312-linux_x86_64.whl), [Download5(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu126torch2.5-cp312-cp312-linux_x86_64.whl) | -| 3.12 | 2.5 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl) | +| 3.12 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.6 | 11.8 | [Download1(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu118torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu118torch2.6-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl), [Download5(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl), [Download6(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.6-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.6-cp312-cp312-linux_x86_64.whl), [Download4(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu126torch2.6-cp312-cp312-linux_x86_64.whl), [Download5(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu126torch2.6-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.6 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl) | -| 3.12 | 2.6 | 12.9 | [Download1(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.6-cp312-cp312-linux_x86_64.whl) | +| 3.12 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.6-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.7 | 11.8 | [Download1(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu118torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu118torch2.7-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.7-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.7-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.7-cp312-cp312-linux_x86_64.whl) | @@ -660,11 +668,13 @@ | 3.12 | 2.8 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.8-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.8 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.8-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.8 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.8-cp312-cp312-linux_x86_64.whl), [Download3(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.6.3+cu128torch2.8-cp312-cp312-linux_x86_64.whl), [Download4(v0.2.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.0/flash_attn-2.6.3+cu128torch2.8-cp312-cp312-linux_x86_64.whl) | -| 3.12 | 2.8 | 12.9 | [Download1(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.8-cp312-cp312-linux_x86_64.whl) | +| 3.12 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.8-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.9 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.9-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.9 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.6.3+cu126torch2.9-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.6.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl) | | 3.12 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu130torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu130torch2.9-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.18/flash_attn-2.6.3+cu130torch2.9-cp312-cp312-linux_x86_64.whl) | +| 3.13 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp313-cp313-linux_x86_64.whl) | +| 3.13 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.7-cp313-cp313-linux_x86_64.whl) | | 3.13 | 2.9 | 12.6 | [Download1(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.6.3+cu126torch2.9-cp313-cp313-linux_x86_64.whl) | | 3.13 | 2.9 | 12.8 | [Download1(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.6.3+cu128torch2.9-cp313-cp313-linux_x86_64.whl) | | 3.13 | 2.9 | 13.0 | [Download1(v0.4.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.18/flash_attn-2.6.3+cu130torch2.9-cp313-cp313-linux_x86_64.whl) | @@ -1061,11 +1071,16 @@ | Python | PyTorch | CUDA | package | | ------ | ------- | ---- | ------- | +| 3.10 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.6-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.10 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu128torch2.9-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.10 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu130torch2.9-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.11 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu128torch2.9-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.11 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu130torch2.9-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.12 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.6-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.12 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.7-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.12 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu128torch2.9-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.13 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.8-cp313-cp313-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.13 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu129torch2.8-cp313-cp313-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | @@ -1076,12 +1091,24 @@ | Python | PyTorch | CUDA | package | | ------ | ------- | ---- | ------- | +| 3.10 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.6-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.10 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.6-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.10 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.10 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.8-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.10 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu128torch2.9-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.10 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu130torch2.9-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.11 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.6-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.11 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.11 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu128torch2.9-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.11 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu130torch2.9-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.12 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.12 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.8-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.12 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.8-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.12 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu128torch2.9-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.12 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu130torch2.9-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.13 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.6-cp313-cp313-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.13 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.8-cp313-cp313-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.13 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.8-cp313-cp313-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | @@ -1092,12 +1119,64 @@ | Python | PyTorch | CUDA | package | | ------ | ------- | ---- | ------- | +| 3.10 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.10 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.10 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.10 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.8-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.10 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu128torch2.9-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.10 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu130torch2.9-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.11 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.11 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.11 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.11 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.11 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu128torch2.9-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.11 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu130torch2.9-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.12 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.12 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.8-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.12 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu128torch2.9-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | | 3.12 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu130torch2.9-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.13 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp313-cp313-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | +| 3.13 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.7-cp313-cp313-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) | + + + +## 🐧 Manylinux2014 x86_64 + +### Flash-Attention 2.8.3 + +
+Packages for Flash-Attention 2.8.3 + +| Python | PyTorch | CUDA | package | +| ------ | ------- | ---- | ------- | +| 3.10 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp310-cp310-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) | +| 3.11 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) | +| 3.12 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) | +| 3.13 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) | + +
+ +### Flash-Attention 2.7.4 + +
+Packages for Flash-Attention 2.7.4 + +| Python | PyTorch | CUDA | package | +| ------ | ------- | ---- | ------- | +| 3.10 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.5-cp310-cp310-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) | +| 3.11 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.5-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) | + +
+ +### Flash-Attention 2.6.3 + +
+Packages for Flash-Attention 2.6.3 + +| Python | PyTorch | CUDA | package | +| ------ | ------- | ---- | ------- | +| 3.10 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) | +| 3.12 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) |
diff --git a/docs/release_history.md b/docs/release_history.md index b4a88b4..e3c9c56 100644 --- a/docs/release_history.md +++ b/docs/release_history.md @@ -1,15 +1,36 @@ ## History +### v0.7.2 + +[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.7.2) + +#### Linux x86_64 + +| Flash-Attention | Python | PyTorch | CUDA | +| ------------------- | ---------------------- | ------------------ | ---------- | +| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.5, 2.6, 2.7, 2.8 | 12.8, 12.9 | + +#### Manylinux 2_24 x86_64 + +| Flash-Attention | Python | PyTorch | CUDA | +| ------------------- | ---------------------- | ------------- | ---------- | +| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.6, 2.7, 2.8 | 12.8, 12.9 | + +#### Manylinux2014 x86_64 + +| Flash-Attention | Python | PyTorch | CUDA | +| ------------------- | ---------------------- | ------- | ---- | +| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.5 | 12.8 | + ### v0.7.0 [Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.7.0) #### Linux x86_64 -| Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12 | 2.9 | 12.8, 13.0 | - +| Flash-Attention | Python | PyTorch | CUDA | +| ------------------- | ---------------- | ------- | ---------- | +| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12 | 2.9 | 12.8, 13.0 | ### v0.6.9 @@ -18,9 +39,8 @@ #### Linux x86_64 | Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.6.3 | 3.14 | 2.9 | 13.0 | - +| --------------- | ------ | ------- | ---- | +| 2.6.3 | 3.14 | 2.9 | 13.0 | ### v0.6.4 @@ -28,10 +48,9 @@ #### Linux arm64 -| Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.7.4, 2.8.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.9 | 12.4, 12.8, 13.0 | - +| Flash-Attention | Python | PyTorch | CUDA | +| --------------- | ---------------- | ------------------ | ---------------- | +| 2.7.4, 2.8.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.9 | 12.4, 12.8, 13.0 | ### v0.6.3 @@ -39,10 +58,9 @@ #### Linux arm64 -| Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.6.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.9 | 12.4, 12.8, 13.0 | - +| Flash-Attention | Python | PyTorch | CUDA | +| --------------- | ---------------- | ------------------ | ---------------- | +| 2.6.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.9 | 12.4, 12.8, 13.0 | ### v0.5.4 @@ -50,21 +68,19 @@ #### Linux x86_64 -| Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | +| Flash-Attention | Python | PyTorch | CUDA | +| ------------------- | ---------------- | ----------------------- | ---------------------- | | 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.8, 2.9 | 12.4, 12.6, 12.8, 13.0 | - ### v0.4.22 [Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.4.22) #### Linux x86_64 -| Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.8.1 | 3.10, 3.11, 3.12, 3.13 | 2.9 | 12.8, 13.0 | - +| Flash-Attention | Python | PyTorch | CUDA | +| --------------- | ---------------------- | ------- | ---------- | +| 2.8.1 | 3.10, 3.11, 3.12, 3.13 | 2.9 | 12.8, 13.0 | ### v0.4.18 @@ -72,9 +88,9 @@ #### Linux x86_64 -| Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.6.3, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.9 | 13.0 | +| Flash-Attention | Python | PyTorch | CUDA | +| --------------- | ---------------------- | ------- | ---- | +| 2.6.3, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.9 | 13.0 | ### v0.4.17 @@ -82,9 +98,9 @@ #### Linux x86_64 -| Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.6.3, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.9 | 12.6, 12.8 | +| Flash-Attention | Python | PyTorch | CUDA | +| --------------- | ---------------------- | ------- | ---------- | +| 2.6.3, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.9 | 12.6, 12.8 | ### v0.4.16 @@ -92,9 +108,9 @@ #### Linux x86_64 -| Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.6.3, 2.8.3 | 3.9 | 2.5, 2.6, 2.7, 2.8 | 12.4, 12.6 | +| Flash-Attention | Python | PyTorch | CUDA | +| --------------- | ------ | ------------------ | ---------- | +| 2.6.3, 2.8.3 | 3.9 | 2.5, 2.6, 2.7, 2.8 | 12.4, 12.6 | ### v0.4.15 @@ -102,15 +118,15 @@ #### Linux x86_64 -| Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.8.3 | 3.11, 3.12, 3.13 | 2.9 | 12.6, 12.8 | +| Flash-Attention | Python | PyTorch | CUDA | +| --------------- | ---------------- | ------- | ---------- | +| 2.8.3 | 3.11, 3.12, 3.13 | 2.9 | 12.6, 12.8 | #### Windows x86_64 -| Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.8.3 | 3.11, 3.12, 3.13 | 2.9 | 12.6 | +| Flash-Attention | Python | PyTorch | CUDA | +| --------------- | ---------------- | ------- | ---- | +| 2.8.3 | 3.11, 3.12, 3.13 | 2.9 | 12.6 | ### v0.4.12 @@ -118,15 +134,15 @@ #### Linux x86_64 -| Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.8.3 | 3.13 | 2.6, 2.7, 2.8 | 12.4, 12.6, 12.8, 12.9 | +| Flash-Attention | Python | PyTorch | CUDA | +| --------------- | ------ | ------------- | ---------------------- | +| 2.8.3 | 3.13 | 2.6, 2.7, 2.8 | 12.4, 12.6, 12.8, 12.9 | #### Windows x86_64 -| Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.8.2 | 3.13 | 2.6, 2.7, 2.8 | 12.4, 12.6 | +| Flash-Attention | Python | PyTorch | CUDA | +| --------------- | ------ | ------------- | ---------- | +| 2.8.2 | 3.13 | 2.6, 2.7, 2.8 | 12.4, 12.6 | ### v0.4.11 @@ -134,9 +150,9 @@ #### Linux x86_64 -| Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.8.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.8 | 12.4, 12.6, 12.8, 12.9 | +| Flash-Attention | Python | PyTorch | CUDA | +| --------------- | ---------------- | ------------------ | ---------------------- | +| 2.8.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.8 | 12.4, 12.6, 12.8, 12.9 | ### v0.4.10 @@ -144,9 +160,9 @@ #### Windows x86_64 -| Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.7.4, 2.8.2 | 3.10, 3.11, 3.12 | 2.7, 2.8 | 12.8 | +| Flash-Attention | Python | PyTorch | CUDA | +| --------------- | ---------------- | -------- | ---- | +| 2.7.4, 2.8.2 | 3.10, 3.11, 3.12 | 2.7, 2.8 | 12.8 | ### v0.4.9 @@ -155,8 +171,8 @@ #### Windows x86_64 | Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.7.4 | 3.11 | 2.7 | 12.8 | +| --------------- | ------ | ------- | ---- | +| 2.7.4 | 3.11 | 2.7 | 12.8 | ### v0.3.18 @@ -164,9 +180,9 @@ #### Linux x86_64 -| Flash-Attention | Python | PyTorch | CUDA | -| --- | --- | --- | --- | -| 2.7.4 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.8 | 12.4, 12.8, 12.9 | +| Flash-Attention | Python | PyTorch | CUDA | +| --------------- | ---------------- | ------------------ | ---------------- | +| 2.7.4 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.8 | 12.4, 12.8, 12.9 | ### v0.3.14