mirror of
https://github.com/BillyOutlast/flash-attention-prebuild-wheels-rocm.git
synced 2026-06-30 23:57:53 -04:00
docs: Update docs
This commit is contained in:
@@ -235,6 +235,7 @@ jobs:
|
||||
run: |
|
||||
git config --global user.name "github-actions[bot]"
|
||||
git config --global user.email "41898282+github-actions[bot]@users.noreply.github.com"
|
||||
git pull
|
||||
if git diff --quiet; then
|
||||
echo "No docs updates to commit."
|
||||
exit 0
|
||||
|
||||
+2
-2
@@ -55,11 +55,11 @@ echo " RAM: ${RAM_GB}GB"
|
||||
if [[ -z "${MAX_JOBS:-}" && -z "${NVCC_THREADS:-}" ]]; then
|
||||
# Calculate max product based on following constraints:
|
||||
# - MAX_JOBS x NVCC_THREADS(<= 4) <= NUM_THREADS
|
||||
# - 2.5GB x MAX_JOBS x NVCC_THREADS(<= 4) <= RAM_GB
|
||||
# - 2.8GB x MAX_JOBS x NVCC_THREADS(<= 4) <= RAM_GB
|
||||
|
||||
# Set MAX_PRODUCT to the smaller of the CPU-thread limit and the RAM limit
|
||||
MAX_PRODUCT_CPU=$NUM_THREADS
|
||||
MAX_PRODUCT_RAM=$(awk -v ram="$RAM_GB" 'BEGIN {print int(ram / 2.5)}')
|
||||
MAX_PRODUCT_RAM=$(awk -v ram="$RAM_GB" 'BEGIN {print int(ram / 2.8)}')
|
||||
MAX_PRODUCT=$((MAX_PRODUCT_CPU < MAX_PRODUCT_RAM ? MAX_PRODUCT_CPU : MAX_PRODUCT_RAM))
|
||||
|
||||
# Set MAX_JOBS and NVCC_THREADS so that MAX_JOBS x NVCC_THREADS ≈ MAX_PRODUCT with NVCC_THREADS <= 4
|
||||
|
||||
+110
-31
@@ -29,6 +29,10 @@
|
||||
- [Flash-Attention 2.8.3](#flash-attention-283)
|
||||
- [Flash-Attention 2.7.4](#flash-attention-274)
|
||||
- [Flash-Attention 2.6.3](#flash-attention-263)
|
||||
- [Manylinux2014 x86_64](#manylinux2014-x86_64)
|
||||
- [Flash-Attention 2.8.3](#flash-attention-283)
|
||||
- [Flash-Attention 2.7.4](#flash-attention-274)
|
||||
- [Flash-Attention 2.6.3](#flash-attention-263)
|
||||
- [Windows x86_64](#windows-x86_64)
|
||||
- [Flash-Attention 2.8.3](#flash-attention-283)
|
||||
- [Flash-Attention 2.8.2](#flash-attention-282)
|
||||
@@ -56,10 +60,10 @@
|
||||
| 3.9 | 2.8 | 12.6 | [Download1(v0.4.16)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.16/flash_attn-2.8.3+cu126torch2.8-cp39-cp39-linux_x86_64.whl) |
|
||||
| 3.10 | 2.5 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.5 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.5-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.5 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download3(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download3(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.9 | [Download1(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu129torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.7-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.7-cp310-cp310-linux_x86_64.whl) |
|
||||
@@ -74,7 +78,7 @@
|
||||
| 3.10 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu130torch2.9-cp310-cp310-linux_x86_64.whl), [Download2(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.8.3+cu130torch2.9-cp310-cp310-linux_x86_64.whl), [Download3(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu130torch2.9-cp310-cp310-linux_x86_64.whl), [Download4(v0.4.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.18/flash_attn-2.8.3+cu130torch2.9-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.11 | 2.5 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.5-cp311-cp311-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.5-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.5 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.5-cp311-cp311-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.5-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.5 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.5-cp311-cp311-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.5-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp311-cp311-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.5-cp311-cp311-linux_x86_64.whl), [Download3(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.5-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.6-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl) |
|
||||
@@ -92,14 +96,14 @@
|
||||
| 3.11 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu130torch2.9-cp311-cp311-linux_x86_64.whl), [Download2(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.8.3+cu130torch2.9-cp311-cp311-linux_x86_64.whl), [Download3(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu130torch2.9-cp311-cp311-linux_x86_64.whl), [Download4(v0.4.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.18/flash_attn-2.8.3+cu130torch2.9-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.12 | 2.5 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.5 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.5-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.5 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.6-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.6 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.6 | 12.9 | [Download1(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu129torch2.6-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.7-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.7-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.7 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.7-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.7-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu124torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu124torch2.8-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu126torch2.8-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.11)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.11/flash_attn-2.8.3+cu128torch2.8-cp312-cp312-linux_x86_64.whl) |
|
||||
@@ -108,6 +112,7 @@
|
||||
| 3.12 | 2.9 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu126torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.8.3+cu126torch2.9-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.15)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.15/flash_attn-2.8.3+cu126torch2.9-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.8.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download3(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download4(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.8.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download5(v0.4.15)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.15/flash_attn-2.8.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.9 | 13.0 | [Download1(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.8.3+cu130torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.8.3+cu130torch2.9-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.18/flash_attn-2.8.3+cu130torch2.9-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.13 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.6 | 12.4 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu124torch2.6-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.6 | 12.6 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu126torch2.6-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.6 | 12.8 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu128torch2.6-cp313-cp313-linux_x86_64.whl) |
|
||||
@@ -117,8 +122,8 @@
|
||||
| 3.13 | 2.7 | 12.8 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu128torch2.7-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.8 | 12.4 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu124torch2.8-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.8 | 12.6 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu126torch2.8-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.8 | 12.8 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu128torch2.8-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.8 | 12.9 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu129torch2.8-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.8-cp313-cp313-linux_x86_64.whl), [Download2(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu128torch2.8-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu129torch2.8-cp313-cp313-linux_x86_64.whl), [Download2(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3+cu129torch2.8-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.9 | 12.6 | [Download1(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.8.3+cu126torch2.9-cp313-cp313-linux_x86_64.whl), [Download2(v0.4.15)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.15/flash_attn-2.8.3+cu126torch2.9-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.9 | 12.8 | [Download1(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.8.3+cu128torch2.9-cp313-cp313-linux_x86_64.whl), [Download2(v0.4.15)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.15/flash_attn-2.8.3+cu128torch2.9-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.9 | 13.0 | [Download1(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.8.3+cu130torch2.9-cp313-cp313-linux_x86_64.whl), [Download2(v0.5.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.2/flash_attn-2.8.3+cu130torch2.9-cp313-cp313-linux_x86_64.whl), [Download3(v0.4.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.18/flash_attn-2.8.3+cu130torch2.9-cp313-cp313-linux_x86_64.whl) |
|
||||
@@ -314,32 +319,32 @@
|
||||
| ------ | ------- | ---- | ------- |
|
||||
| 3.10 | 2.5 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.5-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.5 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.5-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.5 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.5-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.5-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.9 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.7-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.7-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.7-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.7 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.10)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.10/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download3(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.10)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.10/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download4(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.8 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.8-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.8-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.8-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.8 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.8-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.8 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.8-cp310-cp310-linux_x86_64.whl), [Download2(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.7.4+cu128torch2.8-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.8 | 12.9 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.8-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.8-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.8-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.9 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.9-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.9 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.9-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu128torch2.9-cp310-cp310-linux_x86_64.whl), [Download2(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.7.4+cu128torch2.9-cp310-cp310-linux_x86_64.whl), [Download3(v0.4.21)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.21/flash_attn-2.7.4+cu128torch2.9-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu130torch2.9-cp310-cp310-linux_x86_64.whl), [Download2(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.7.4+cu130torch2.9-cp310-cp310-linux_x86_64.whl), [Download3(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu130torch2.9-cp310-cp310-linux_x86_64.whl), [Download4(v0.4.21)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.21/flash_attn-2.7.4+cu130torch2.9-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.11 | 2.5 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.5-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.5-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.5-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.5 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.5-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.5 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.5-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.5-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.5-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.6-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.6-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.6-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.6-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.9 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.6-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.7-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.7-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.7-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.7 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.10)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.10/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download3(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.10)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.10/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download4(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.8 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.8-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.8-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.8-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.8 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.8-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.8 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download2(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.7.4+cu128torch2.8-cp311-cp311-linux_x86_64.whl) |
|
||||
@@ -357,15 +362,18 @@
|
||||
| 3.12 | 2.6 | 12.9 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.6-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.7-cp312-cp312-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.7-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.7-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.7 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.10)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.10/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download3(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download3(v0.3.10)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.10/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-linux_x86_64.whl), [Download4(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.8-cp312-cp312-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.7.4+cu124torch2.8-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.8-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.8 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.7.4+cu128torch2.8-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.9 | [Download1(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.8-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu128torch2.8-cp312-cp312-linux_x86_64.whl), [Download3(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.7.4+cu128torch2.8-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu129torch2.8-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.9 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu124torch2.9-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.9 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.7.4+cu126torch2.9-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.7.4+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.21)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.21/flash_attn-2.7.4+cu128torch2.9-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu130torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.7.4+cu130torch2.9-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.21)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.21/flash_attn-2.7.4+cu130torch2.9-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.13 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.6-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.8-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.8-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.9 | 12.8 | [Download1(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.7.4+cu128torch2.9-cp313-cp313-linux_x86_64.whl), [Download2(v0.4.21)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.21/flash_attn-2.7.4+cu128torch2.9-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.9 | 13.0 | [Download1(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.7.4+cu130torch2.9-cp313-cp313-linux_x86_64.whl), [Download2(v0.4.21)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.21/flash_attn-2.7.4+cu130torch2.9-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.14 | 2.9 | 12.8 | [Download1(v0.6.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.8/flash_attn-2.7.4+cu128torch2.9-cp314-cp314-linux_x86_64.whl) |
|
||||
@@ -572,20 +580,20 @@
|
||||
| 3.10 | 2.5 | 12.1 | [Download1(v0.0.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.2/flash_attn-2.6.3+cu121torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.0.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.1/flash_attn-2.6.3+cu121torch2.5-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.5 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download3(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download5(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download6(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download7(v0.0.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.2/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl), [Download8(v0.0.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.1/flash_attn-2.6.3+cu124torch2.5-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.5 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.5-cp310-cp310-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.5-cp310-cp310-linux_x86_64.whl), [Download4(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu126torch2.5-cp310-cp310-linux_x86_64.whl), [Download5(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu126torch2.5-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.5 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 11.8 | [Download1(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu118torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu118torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download3(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download5(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl), [Download6(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu124torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.6-cp310-cp310-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.6-cp310-cp310-linux_x86_64.whl), [Download4(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu126torch2.6-cp310-cp310-linux_x86_64.whl), [Download5(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu126torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.9 | [Download1(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.6-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.7 | 11.8 | [Download1(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu118torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu118torch2.7-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.7-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.7-cp310-cp310-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.7-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.7 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.9/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download4(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download5(v0.0.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.9/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download6(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download4(v0.3.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.9/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download5(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download6(v0.0.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.9/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl), [Download7(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.8 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.8-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.8-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.8 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.8-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.8 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.8-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.8-cp310-cp310-linux_x86_64.whl), [Download3(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.6.3+cu128torch2.8-cp310-cp310-linux_x86_64.whl), [Download4(v0.2.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.0/flash_attn-2.6.3+cu128torch2.8-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.8 | 12.9 | [Download1(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.8-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.8-cp310-cp310-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.8-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.9 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.9-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.9 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.9-cp310-cp310-linux_x86_64.whl), [Download2(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.6.3+cu126torch2.9-cp310-cp310-linux_x86_64.whl) |
|
||||
| 3.10 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu128torch2.9-cp310-cp310-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.9-cp310-cp310-linux_x86_64.whl), [Download3(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.6.3+cu128torch2.9-cp310-cp310-linux_x86_64.whl) |
|
||||
@@ -616,15 +624,15 @@
|
||||
| 3.11 | 2.6 | 11.8 | [Download1(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu118torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu118torch2.6-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download3(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download5(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl), [Download6(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu124torch2.6-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.6-cp311-cp311-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.6-cp311-cp311-linux_x86_64.whl), [Download4(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu126torch2.6-cp311-cp311-linux_x86_64.whl), [Download5(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu126torch2.6-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.9 | [Download1(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.6-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.6-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.7 | 11.8 | [Download1(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu118torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu118torch2.7-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.7-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.7-cp311-cp311-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.7-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.7 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.9/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download4(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download5(v0.0.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.9/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download6(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download4(v0.3.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.9/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download5(v0.1.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.1.0/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download6(v0.0.9)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.9/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl), [Download7(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.8 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.8-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.8-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.8 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.8-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.8 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download3(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download4(v0.2.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.0/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download4(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl), [Download5(v0.2.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.0/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.8 | 12.9 | [Download1(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.8-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.9 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.9-cp311-cp311-linux_x86_64.whl) |
|
||||
| 3.11 | 2.9 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.9-cp311-cp311-linux_x86_64.whl), [Download2(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.6.3+cu126torch2.9-cp311-cp311-linux_x86_64.whl) |
|
||||
@@ -647,12 +655,12 @@
|
||||
| 3.12 | 2.5 | 12.1 | [Download1(v0.0.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.2/flash_attn-2.6.3+cu121torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.0.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.1/flash_attn-2.6.3+cu121torch2.5-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.0/flash_attn-2.6.3+cu121torch2.5-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.5 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download5(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download6(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download7(v0.0.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.2/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download8(v0.0.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.1/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl), [Download9(v0.0.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.0/flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.5 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.5-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.5-cp312-cp312-linux_x86_64.whl), [Download4(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu126torch2.5-cp312-cp312-linux_x86_64.whl), [Download5(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu126torch2.5-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.5 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download3(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.6 | 11.8 | [Download1(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu118torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu118torch2.6-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.6 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl), [Download4(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl), [Download5(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl), [Download6(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu124torch2.6-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.6 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.6-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.6-cp312-cp312-linux_x86_64.whl), [Download4(v0.0.6)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.6/flash_attn-2.6.3+cu126torch2.6-cp312-cp312-linux_x86_64.whl), [Download5(v0.0.5)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.5/flash_attn-2.6.3+cu126torch2.6-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.6 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu128torch2.6-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.6 | 12.9 | [Download1(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.6-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.6-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.7 | 11.8 | [Download1(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu118torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu118torch2.7-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.7 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.7-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.7 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.7-cp312-cp312-linux_x86_64.whl), [Download2(v0.0.8)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.6.3+cu126torch2.7-cp312-cp312-linux_x86_64.whl), [Download3(v0.0.7)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.7/flash_attn-2.6.3+cu126torch2.7-cp312-cp312-linux_x86_64.whl) |
|
||||
@@ -660,11 +668,13 @@
|
||||
| 3.12 | 2.8 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu124torch2.8-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.8-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.8 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu128torch2.8-cp312-cp312-linux_x86_64.whl), [Download3(v0.2.1)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.1/flash_attn-2.6.3+cu128torch2.8-cp312-cp312-linux_x86_64.whl), [Download4(v0.2.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.2.0/flash_attn-2.6.3+cu128torch2.8-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.9 | [Download1(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.8-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.8-cp312-cp312-linux_x86_64.whl), [Download2(v0.3.14)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.6.3+cu129torch2.8-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.9 | 12.4 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu124torch2.9-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.9 | 12.6 | [Download1(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu126torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.6.3+cu126torch2.9-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.6.3+cu128torch2.9-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.12 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu130torch2.9-cp312-cp312-linux_x86_64.whl), [Download2(v0.5.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.4/flash_attn-2.6.3+cu130torch2.9-cp312-cp312-linux_x86_64.whl), [Download3(v0.4.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.18/flash_attn-2.6.3+cu130torch2.9-cp312-cp312-linux_x86_64.whl) |
|
||||
| 3.13 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.7-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.9 | 12.6 | [Download1(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.6.3+cu126torch2.9-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.9 | 12.8 | [Download1(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.6.3+cu128torch2.9-cp313-cp313-linux_x86_64.whl) |
|
||||
| 3.13 | 2.9 | 13.0 | [Download1(v0.4.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.18/flash_attn-2.6.3+cu130torch2.9-cp313-cp313-linux_x86_64.whl) |
|
||||
@@ -1061,11 +1071,16 @@
|
||||
|
||||
| Python | PyTorch | CUDA | package |
|
||||
| ------ | ------- | ---- | ------- |
|
||||
| 3.10 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.6-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.10 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu128torch2.9-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.10 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu130torch2.9-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.11 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu128torch2.9-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.11 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu130torch2.9-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.12 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.6-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.12 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.7-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.12 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.8.3+cu128torch2.9-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.13 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.8-cp313-cp313-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.13 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu129torch2.8-cp313-cp313-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
|
||||
</details>
|
||||
|
||||
@@ -1076,12 +1091,24 @@
|
||||
|
||||
| Python | PyTorch | CUDA | package |
|
||||
| ------ | ------- | ---- | ------- |
|
||||
| 3.10 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.6-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.6-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.10 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.7-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.10 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.8-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.10 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu128torch2.9-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.10 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu130torch2.9-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.6-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.11 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.7-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.11 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu128torch2.9-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.11 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu130torch2.9-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.12 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.7-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.8-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.8-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.12 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu128torch2.9-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.12 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.7.4+cu130torch2.9-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.13 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.6-cp313-cp313-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.13 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.8-cp313-cp313-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.13 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu129torch2.8-cp313-cp313-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
|
||||
</details>
|
||||
|
||||
@@ -1092,12 +1119,64 @@
|
||||
|
||||
| Python | PyTorch | CUDA | package |
|
||||
| ------ | ------- | ---- | ------- |
|
||||
| 3.10 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.6-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.10 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.10 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.7-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.10 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.8-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.10 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu128torch2.9-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.10 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu130torch2.9-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.6-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.11 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.11 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.7-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.11 | 2.8 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.8-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.11 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu128torch2.9-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.11 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu130torch2.9-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.12 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.12 | 2.8 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.8-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.12 | 2.9 | 12.8 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu128torch2.9-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.12 | 2.9 | 13.0 | [Download1(v0.7.0)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.0/flash_attn-2.6.3+cu130torch2.9-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.13 | 2.6 | 12.9 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu129torch2.6-cp313-cp313-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.13 | 2.7 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.7-cp313-cp313-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
|
||||
</details>
|
||||
|
||||
## 🐧 Manylinux2014 x86_64
|
||||
|
||||
### Flash-Attention 2.8.3
|
||||
|
||||
<details>
|
||||
<summary>Packages for Flash-Attention 2.8.3</summary>
|
||||
|
||||
| Python | PyTorch | CUDA | package |
|
||||
| ------ | ------- | ---- | ------- |
|
||||
| 3.10 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp310-cp310-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.11 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.12 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.13 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.8.3+cu128torch2.5-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
|
||||
</details>
|
||||
|
||||
### Flash-Attention 2.7.4
|
||||
|
||||
<details>
|
||||
<summary>Packages for Flash-Attention 2.7.4</summary>
|
||||
|
||||
| Python | PyTorch | CUDA | package |
|
||||
| ------ | ------- | ---- | ------- |
|
||||
| 3.10 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.5-cp310-cp310-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.11 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.7.4+cu128torch2.5-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
|
||||
</details>
|
||||
|
||||
### Flash-Attention 2.6.3
|
||||
|
||||
<details>
|
||||
<summary>Packages for Flash-Attention 2.6.3</summary>
|
||||
|
||||
| Python | PyTorch | CUDA | package |
|
||||
| ------ | ------- | ---- | ------- |
|
||||
| 3.10 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.5-cp310-cp310-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
| 3.12 | 2.5 | 12.8 | [Download1(v0.7.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.7.2/flash_attn-2.6.3+cu128torch2.5-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl) |
|
||||
|
||||
</details>
|
||||
|
||||
|
||||
+70
-54
@@ -1,15 +1,36 @@
|
||||
## History
|
||||
|
||||
### v0.7.2
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.7.2)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| ------------------- | ---------------------- | ------------------ | ---------- |
|
||||
| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.5, 2.6, 2.7, 2.8 | 12.8, 12.9 |
|
||||
|
||||
#### Manylinux 2_24 x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| ------------------- | ---------------------- | ------------- | ---------- |
|
||||
| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.6, 2.7, 2.8 | 12.8, 12.9 |
|
||||
|
||||
#### Manylinux2014 x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| ------------------- | ---------------------- | ------- | ---- |
|
||||
| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.5 | 12.8 |
|
||||
|
||||
### v0.7.0
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.7.0)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12 | 2.9 | 12.8, 13.0 |
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| ------------------- | ---------------- | ------- | ---------- |
|
||||
| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12 | 2.9 | 12.8, 13.0 |
|
||||
|
||||
### v0.6.9
|
||||
|
||||
@@ -18,9 +39,8 @@
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.6.3 | 3.14 | 2.9 | 13.0 |
|
||||
|
||||
| --------------- | ------ | ------- | ---- |
|
||||
| 2.6.3 | 3.14 | 2.9 | 13.0 |
|
||||
|
||||
### v0.6.4
|
||||
|
||||
@@ -28,10 +48,9 @@
|
||||
|
||||
#### Linux arm64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.7.4, 2.8.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.9 | 12.4, 12.8, 13.0 |
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | ------------------ | ---------------- |
|
||||
| 2.7.4, 2.8.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.9 | 12.4, 12.8, 13.0 |
|
||||
|
||||
### v0.6.3
|
||||
|
||||
@@ -39,10 +58,9 @@
|
||||
|
||||
#### Linux arm64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.6.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.9 | 12.4, 12.8, 13.0 |
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | ------------------ | ---------------- |
|
||||
| 2.6.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.9 | 12.4, 12.8, 13.0 |
|
||||
|
||||
### v0.5.4
|
||||
|
||||
@@ -50,21 +68,19 @@
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| ------------------- | ---------------- | ----------------------- | ---------------------- |
|
||||
| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.8, 2.9 | 12.4, 12.6, 12.8, 13.0 |
|
||||
|
||||
|
||||
### v0.4.22
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.4.22)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.8.1 | 3.10, 3.11, 3.12, 3.13 | 2.9 | 12.8, 13.0 |
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------------- | ------- | ---------- |
|
||||
| 2.8.1 | 3.10, 3.11, 3.12, 3.13 | 2.9 | 12.8, 13.0 |
|
||||
|
||||
### v0.4.18
|
||||
|
||||
@@ -72,9 +88,9 @@
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.6.3, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.9 | 13.0 |
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------------- | ------- | ---- |
|
||||
| 2.6.3, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.9 | 13.0 |
|
||||
|
||||
### v0.4.17
|
||||
|
||||
@@ -82,9 +98,9 @@
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.6.3, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.9 | 12.6, 12.8 |
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------------- | ------- | ---------- |
|
||||
| 2.6.3, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.9 | 12.6, 12.8 |
|
||||
|
||||
### v0.4.16
|
||||
|
||||
@@ -92,9 +108,9 @@
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.6.3, 2.8.3 | 3.9 | 2.5, 2.6, 2.7, 2.8 | 12.4, 12.6 |
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ------ | ------------------ | ---------- |
|
||||
| 2.6.3, 2.8.3 | 3.9 | 2.5, 2.6, 2.7, 2.8 | 12.4, 12.6 |
|
||||
|
||||
### v0.4.15
|
||||
|
||||
@@ -102,15 +118,15 @@
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.8.3 | 3.11, 3.12, 3.13 | 2.9 | 12.6, 12.8 |
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | ------- | ---------- |
|
||||
| 2.8.3 | 3.11, 3.12, 3.13 | 2.9 | 12.6, 12.8 |
|
||||
|
||||
#### Windows x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.8.3 | 3.11, 3.12, 3.13 | 2.9 | 12.6 |
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | ------- | ---- |
|
||||
| 2.8.3 | 3.11, 3.12, 3.13 | 2.9 | 12.6 |
|
||||
|
||||
### v0.4.12
|
||||
|
||||
@@ -118,15 +134,15 @@
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.8.3 | 3.13 | 2.6, 2.7, 2.8 | 12.4, 12.6, 12.8, 12.9 |
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ------ | ------------- | ---------------------- |
|
||||
| 2.8.3 | 3.13 | 2.6, 2.7, 2.8 | 12.4, 12.6, 12.8, 12.9 |
|
||||
|
||||
#### Windows x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.8.2 | 3.13 | 2.6, 2.7, 2.8 | 12.4, 12.6 |
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ------ | ------------- | ---------- |
|
||||
| 2.8.2 | 3.13 | 2.6, 2.7, 2.8 | 12.4, 12.6 |
|
||||
|
||||
### v0.4.11
|
||||
|
||||
@@ -134,9 +150,9 @@
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.8.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.8 | 12.4, 12.6, 12.8, 12.9 |
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | ------------------ | ---------------------- |
|
||||
| 2.8.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.8 | 12.4, 12.6, 12.8, 12.9 |
|
||||
|
||||
### v0.4.10
|
||||
|
||||
@@ -144,9 +160,9 @@
|
||||
|
||||
#### Windows x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.7.4, 2.8.2 | 3.10, 3.11, 3.12 | 2.7, 2.8 | 12.8 |
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | -------- | ---- |
|
||||
| 2.7.4, 2.8.2 | 3.10, 3.11, 3.12 | 2.7, 2.8 | 12.8 |
|
||||
|
||||
### v0.4.9
|
||||
|
||||
@@ -155,8 +171,8 @@
|
||||
#### Windows x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.7.4 | 3.11 | 2.7 | 12.8 |
|
||||
| --------------- | ------ | ------- | ---- |
|
||||
| 2.7.4 | 3.11 | 2.7 | 12.8 |
|
||||
|
||||
### v0.3.18
|
||||
|
||||
@@ -164,9 +180,9 @@
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.7.4 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.8 | 12.4, 12.8, 12.9 |
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | ------------------ | ---------------- |
|
||||
| 2.7.4 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.8 | 12.4, 12.8, 12.9 |
|
||||
|
||||
### v0.3.14
|
||||
|
||||
|
||||
Reference in New Issue
Block a user