From bc847f013078cba400f93b4190055cdcb8fb7a2d Mon Sep 17 00:00:00 2001 From: "github-actions[bot]" <41898282+github-actions[bot]@users.noreply.github.com> Date: Fri, 5 Dec 2025 10:43:44 +0000 Subject: [PATCH] docs: update docs for v0.6.3 --- docs/packages.md | 35 +++++++++++++++++++++++++++++++++++ docs/release_history.md | 11 +++++++++++ 2 files changed, 46 insertions(+) diff --git a/docs/packages.md b/docs/packages.md index 0f5d20f..16bf79c 100644 --- a/docs/packages.md +++ b/docs/packages.md @@ -21,6 +21,8 @@ - [Flash-Attention 2.5.6](#flash-attention-256) - [Flash-Attention 2.4.3](#flash-attention-243) - [Flash-Attention 1.0.9](#flash-attention-109) +- [Linux arm64](#linux-arm64) + - [Flash-Attention 2.6.3](#flash-attention-263) - [Windows x86_64](#windows-x86_64) - [Flash-Attention 2.8.3](#flash-attention-283) - [Flash-Attention 2.8.2](#flash-attention-282) @@ -959,6 +961,39 @@ +## 🐧 Linux arm64 + +### Flash-Attention 2.6.3 + +
<details> +<summary>Packages for Flash-Attention 2.6.3</summary> + +| Python | PyTorch | CUDA | package | +| ------ | ------- | ---- | ------- | +| 3.10 | 2.5 | 12.4 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu124torch2.5-cp310-cp310-linux_aarch64.whl) | +| 3.10 | 2.5 | 12.8 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu128torch2.5-cp310-cp310-linux_aarch64.whl) | +| 3.10 | 2.6 | 12.8 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu128torch2.6-cp310-cp310-linux_aarch64.whl) | +| 3.10 | 2.7 | 12.8 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu128torch2.7-cp310-cp310-linux_aarch64.whl) | +| 3.10 | 2.9 | 12.4 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu124torch2.9-cp310-cp310-linux_aarch64.whl) | +| 3.10 | 2.9 | 12.8 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu128torch2.9-cp310-cp310-linux_aarch64.whl) | +| 3.10 | 2.9 | 13.0 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu130torch2.9-cp310-cp310-linux_aarch64.whl) | +| 3.11 | 2.5 | 12.4 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu124torch2.5-cp311-cp311-linux_aarch64.whl) | +| 3.11 | 2.5 | 12.8 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu128torch2.5-cp311-cp311-linux_aarch64.whl) |
+| 3.11 | 2.6 | 12.8 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu128torch2.6-cp311-cp311-linux_aarch64.whl) | +| 3.11 | 2.7 | 12.8 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu128torch2.7-cp311-cp311-linux_aarch64.whl) | +| 3.11 | 2.9 | 12.4 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu124torch2.9-cp311-cp311-linux_aarch64.whl) | +| 3.11 | 2.9 | 12.8 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu128torch2.9-cp311-cp311-linux_aarch64.whl) | +| 3.11 | 2.9 | 13.0 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu130torch2.9-cp311-cp311-linux_aarch64.whl) | +| 3.12 | 2.5 | 12.4 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu124torch2.5-cp312-cp312-linux_aarch64.whl) | +| 3.12 | 2.5 | 12.8 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu128torch2.5-cp312-cp312-linux_aarch64.whl) | +| 3.12 | 2.6 | 12.8 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu128torch2.6-cp312-cp312-linux_aarch64.whl) | +| 3.12 | 2.7 | 12.8 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu128torch2.7-cp312-cp312-linux_aarch64.whl) | +| 3.12 | 2.9 | 12.4 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu124torch2.9-cp312-cp312-linux_aarch64.whl) |
+| 3.12 | 2.9 | 12.8 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu128torch2.9-cp312-cp312-linux_aarch64.whl) | +| 3.12 | 2.9 | 13.0 | [Download1(v0.6.3)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.6.3/flash_attn-2.6.3%2Bcu130torch2.9-cp312-cp312-linux_aarch64.whl) | + +</details>
+ ## 🪟 Windows x86_64 ### Flash-Attention 2.8.3 diff --git a/docs/release_history.md b/docs/release_history.md index 3b0c810..5dcf993 100644 --- a/docs/release_history.md +++ b/docs/release_history.md @@ -1,5 +1,16 @@ ## History +### v0.6.3 + +[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.6.3) + +#### Linux arm64 + +| Flash-Attention | Python | PyTorch | CUDA | +| --- | --- | --- | --- | +| 2.6.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.9 | 12.4, 12.8, 13.0 | + + ### v0.5.4 [Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.5.4)