From 34b36b749c8ed7cbfcf53e3b7b7c049faf6453a4 Mon Sep 17 00:00:00 2001
From: "github-actions[bot]" <41898282+github-actions[bot]@users.noreply.github.com>
Date: Sat, 6 Dec 2025 15:21:57 +0000
Subject: [PATCH] docs: update docs for v0.6.4

---
 docs/packages.md        | 49 +++++++++++++++++++++++++++++++++++++++++
 docs/release_history.md | 11 +++++++++
 2 files changed, 60 insertions(+)

diff --git a/docs/packages.md b/docs/packages.md
index 16bf79c..ee62bd4 100644
--- a/docs/packages.md
+++ b/docs/packages.md
@@ -22,6 +22,8 @@
   - [Flash-Attention 2.4.3](#flash-attention-243)
   - [Flash-Attention 1.0.9](#flash-attention-109)
 - [Linux arm64](#linux-arm64)
+  - [Flash-Attention 2.8.3](#flash-attention-283)
+  - [Flash-Attention 2.7.4](#flash-attention-274)
   - [Flash-Attention 2.6.3](#flash-attention-263)
 - [Windows x86_64](#windows-x86_64)
   - [Flash-Attention 2.8.3](#flash-attention-283)
@@ -963,6 +965,53 @@
 
 ## 🐧 Linux arm64
 
+### Flash-Attention 2.8.3
+
+<details>
+<summary>Packages for Flash-Attention 2.8.3</summary>
+
+| Python | PyTorch | CUDA | package |
+| ------ | ------- | ---- | ------- |
+| 3.10 | 2.5 | 12.4 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu124torch2.5-cp310-cp310-linux_aarch64.whl) |
+| 3.10 | 2.5 | 12.8 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu128torch2.5-cp310-cp310-linux_aarch64.whl) |
+| 3.10 | 2.6 | 12.8 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu128torch2.6-cp310-cp310-linux_aarch64.whl) |
+| 3.10 | 2.7 | 12.8 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu128torch2.7-cp310-cp310-linux_aarch64.whl) |
+| 3.10 | 2.9 | 12.4 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu124torch2.9-cp310-cp310-linux_aarch64.whl) |
+| 3.10 | 2.9 | 12.8 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu128torch2.9-cp310-cp310-linux_aarch64.whl) |
+| 3.10 | 2.9 | 13.0 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu130torch2.9-cp310-cp310-linux_aarch64.whl) |
+| 3.11 | 2.5 | 12.4 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu124torch2.5-cp311-cp311-linux_aarch64.whl) |
+| 3.11 | 2.5 | 12.8 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu128torch2.5-cp311-cp311-linux_aarch64.whl) |
+| 3.11 | 2.6 | 12.8 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu128torch2.6-cp311-cp311-linux_aarch64.whl) |
+| 3.11 | 2.7 | 12.8 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu128torch2.7-cp311-cp311-linux_aarch64.whl) |
+| 3.11 | 2.9 | 12.4 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu124torch2.9-cp311-cp311-linux_aarch64.whl) |
+| 3.11 | 2.9 | 12.8 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu128torch2.9-cp311-cp311-linux_aarch64.whl) |
+| 3.11 | 2.9 | 13.0 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu130torch2.9-cp311-cp311-linux_aarch64.whl) |
+| 3.12 | 2.5 | 12.4 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu124torch2.5-cp312-cp312-linux_aarch64.whl) |
+| 3.12 | 2.5 | 12.8 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu128torch2.5-cp312-cp312-linux_aarch64.whl) |
+| 3.12 | 2.6 | 12.8 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu128torch2.6-cp312-cp312-linux_aarch64.whl) |
+| 3.12 | 2.7 | 12.8 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu128torch2.7-cp312-cp312-linux_aarch64.whl) |
+| 3.12 | 2.9 | 12.4 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu124torch2.9-cp312-cp312-linux_aarch64.whl) |
+| 3.12 | 2.9 | 12.8 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu128torch2.9-cp312-cp312-linux_aarch64.whl) |
+| 3.12 | 2.9 | 13.0 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.8.3%2Bcu130torch2.9-cp312-cp312-linux_aarch64.whl) |
+
+</details>
+
+### Flash-Attention 2.7.4
+
+<details>
+<summary>Packages for Flash-Attention 2.7.4</summary>
+
+| Python | PyTorch | CUDA | package |
+| ------ | ------- | ---- | ------- |
+| 3.10 | 2.5 | 12.4 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.7.4%2Bcu124torch2.5-cp310-cp310-linux_aarch64.whl) |
+| 3.10 | 2.9 | 12.4 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.7.4%2Bcu124torch2.9-cp310-cp310-linux_aarch64.whl) |
+| 3.11 | 2.5 | 12.4 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.7.4%2Bcu124torch2.5-cp311-cp311-linux_aarch64.whl) |
+| 3.11 | 2.9 | 12.4 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.7.4%2Bcu124torch2.9-cp311-cp311-linux_aarch64.whl) |
+| 3.12 | 2.5 | 12.4 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.7.4%2Bcu124torch2.5-cp312-cp312-linux_aarch64.whl) |
+| 3.12 | 2.9 | 12.4 | [Download1(v0.6.4)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.4/flash_attn-2.7.4%2Bcu124torch2.9-cp312-cp312-linux_aarch64.whl) |
+
+</details>
+
 ### Flash-Attention 2.6.3
 
 <details>
diff --git a/docs/release_history.md b/docs/release_history.md
index 5dcf993..aafc8dd 100644
--- a/docs/release_history.md
+++ b/docs/release_history.md
@@ -1,5 +1,16 @@
 ## History
 
+### v0.6.4
+
+[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.6.4)
+
+#### Linux arm64
+
+| Flash-Attention | Python | PyTorch | CUDA |
+| --- | --- | --- | --- |
+| 2.7.4, 2.8.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.9 | 12.4, 12.8, 13.0 |
+
+
 ### v0.6.3
 
 [Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.6.3)