mirror of
https://github.com/BillyOutlast/flash-attention-prebuild-wheels-rocm.git
synced 2026-07-01 01:37:53 -04:00
refactor: rename docs to doc and pages to docs for GitHub Pages
- Rename docs/ to doc/ (contains packages.md, release_history.md, etc.) - Rename pages/ to docs/ (contains search page index.html) - Update all references in README.md, workflows, and Python scripts GitHub Pages only supports / or /docs as the source directory.
This commit is contained in:
Binary file not shown.
|
Before Width: | Height: | Size: 107 KiB |
@@ -1,206 +0,0 @@
|
||||
[
|
||||
{
|
||||
"timestamp": "2024-10-27T00:00:00+00:00",
|
||||
"total_downloads": 0
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-04T13:25:33.785415+00:00",
|
||||
"total_downloads": 906514
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-04T13:26:09.117076+00:00",
|
||||
"total_downloads": 906524
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-04T13:46:48.639327+00:00",
|
||||
"total_downloads": 906741
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-04T13:53:02.674280+00:00",
|
||||
"total_downloads": 906828
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-04T13:53:35.050423+00:00",
|
||||
"total_downloads": 906834
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-04T13:56:13.655744+00:00",
|
||||
"total_downloads": 906837
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-04T14:12:29.585666+00:00",
|
||||
"total_downloads": 907019
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-05T02:07:22.638150+00:00",
|
||||
"total_downloads": 913445
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-06T02:01:02.040321+00:00",
|
||||
"total_downloads": 929720
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-07T02:22:24.324150+00:00",
|
||||
"total_downloads": 941666
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-08T02:08:27.290730+00:00",
|
||||
"total_downloads": 954577
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-09T02:07:15.526725+00:00",
|
||||
"total_downloads": 969053
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-10T02:09:18.798442+00:00",
|
||||
"total_downloads": 984725
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-11T02:11:06.533847+00:00",
|
||||
"total_downloads": 999175
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-12T02:10:43.804376+00:00",
|
||||
"total_downloads": 1014577
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-13T02:03:59.555295+00:00",
|
||||
"total_downloads": 1030197
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-14T02:23:24.651189+00:00",
|
||||
"total_downloads": 1044084
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-15T02:20:57.379722+00:00",
|
||||
"total_downloads": 1057611
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-16T02:11:32.003530+00:00",
|
||||
"total_downloads": 1073249
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-17T02:06:31.128465+00:00",
|
||||
"total_downloads": 1092907
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-19T02:10:30.708440+00:00",
|
||||
"total_downloads": 1126692
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-20T02:03:34.736682+00:00",
|
||||
"total_downloads": 1140840
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-21T02:23:23.025497+00:00",
|
||||
"total_downloads": 1152592
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-22T02:22:22.608573+00:00",
|
||||
"total_downloads": 1165046
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-23T02:11:29.306262+00:00",
|
||||
"total_downloads": 1180840
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-24T02:09:36.492846+00:00",
|
||||
"total_downloads": 1196392
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-25T02:11:45.358891+00:00",
|
||||
"total_downloads": 1211783
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-26T02:10:43.618583+00:00",
|
||||
"total_downloads": 1225422
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-27T02:08:31.512530+00:00",
|
||||
"total_downloads": 1239979
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-28T02:29:31.978407+00:00",
|
||||
"total_downloads": 1253764
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-29T02:27:04.839226+00:00",
|
||||
"total_downloads": 1267980
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-30T02:12:18.789031+00:00",
|
||||
"total_downloads": 1281832
|
||||
},
|
||||
{
|
||||
"timestamp": "2025-12-31T02:12:59.928773+00:00",
|
||||
"total_downloads": 1295884
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-01T02:30:20.978230+00:00",
|
||||
"total_downloads": 1308150
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-02T02:20:37.631510+00:00",
|
||||
"total_downloads": 1319313
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-03T02:07:47.899993+00:00",
|
||||
"total_downloads": 1330611
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-04T02:31:30.898971+00:00",
|
||||
"total_downloads": 1342368
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-05T02:31:58.845097+00:00",
|
||||
"total_downloads": 1353341
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-06T02:20:11.131849+00:00",
|
||||
"total_downloads": 1367158
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-07T02:19:58.869512+00:00",
|
||||
"total_downloads": 1383482
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-08T02:20:33.794945+00:00",
|
||||
"total_downloads": 1399139
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-09T02:21:07.367934+00:00",
|
||||
"total_downloads": 1414967
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-10T02:10:52.025266+00:00",
|
||||
"total_downloads": 1429205
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-11T02:31:21.453872+00:00",
|
||||
"total_downloads": 1441034
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-12T02:26:36.790351+00:00",
|
||||
"total_downloads": 1452726
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-13T02:12:17.561263+00:00",
|
||||
"total_downloads": 1466508
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-14T02:25:34.083215+00:00",
|
||||
"total_downloads": 1481868
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-15T02:19:53.181117+00:00",
|
||||
"total_downloads": 1496011
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-16T02:21:54.143763+00:00",
|
||||
"total_downloads": 1510613
|
||||
},
|
||||
{
|
||||
"timestamp": "2026-01-17T02:09:18.614756+00:00",
|
||||
"total_downloads": 1523451
|
||||
}
|
||||
]
|
||||
+1033
File diff suppressed because it is too large
Load Diff
-1392
File diff suppressed because it is too large
Load Diff
@@ -1,383 +0,0 @@
|
||||
## History
|
||||
|
||||
### v0.7.7
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.7.7)
|
||||
|
||||
#### Windows x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.8.3 | 3.10, 3.11, 3.13 | 2.5, 2.7, 2.8 | 12.8 |
|
||||
|
||||
|
||||
### v0.7.6
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.7.6)
|
||||
|
||||
#### Windows x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --- | --- | --- | --- |
|
||||
| 2.8.3 | 3.12 | 2.9 | 12.8 |
|
||||
|
||||
|
||||
### v0.7.2
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.7.2)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| ------------------- | ---------------------- | ------------------ | ---------- |
|
||||
| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.5, 2.6, 2.7, 2.8 | 12.8, 12.9 |
|
||||
|
||||
#### Manylinux 2_24 x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| ------------------- | ---------------------- | ------------- | ---------- |
|
||||
| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.6, 2.7, 2.8 | 12.8, 12.9 |
|
||||
|
||||
#### Manylinux2014 x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| ------------------- | ---------------------- | ------- | ---- |
|
||||
| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.5 | 12.8 |
|
||||
|
||||
### v0.7.0
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.7.0)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| ------------------- | ---------------- | ------- | ---------- |
|
||||
| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12 | 2.9 | 12.8, 13.0 |
|
||||
|
||||
### v0.6.9
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.6.9)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ------ | ------- | ---- |
|
||||
| 2.6.3 | 3.14 | 2.9 | 13.0 |
|
||||
|
||||
### v0.6.4
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.6.4)
|
||||
|
||||
#### Linux arm64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | ------------------ | ---------------- |
|
||||
| 2.7.4, 2.8.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.9 | 12.4, 12.8, 13.0 |
|
||||
|
||||
### v0.6.3
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.6.3)
|
||||
|
||||
#### Linux arm64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | ------------------ | ---------------- |
|
||||
| 2.6.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.9 | 12.4, 12.8, 13.0 |
|
||||
|
||||
### v0.5.4
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.5.4)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| ------------------- | ---------------- | ----------------------- | ---------------------- |
|
||||
| 2.6.3, 2.7.4, 2.8.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.8, 2.9 | 12.4, 12.6, 12.8, 13.0 |
|
||||
|
||||
### v0.4.22
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.4.22)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------------- | ------- | ---------- |
|
||||
| 2.8.1 | 3.10, 3.11, 3.12, 3.13 | 2.9 | 12.8, 13.0 |
|
||||
|
||||
### v0.4.18
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.4.18)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------------- | ------- | ---- |
|
||||
| 2.6.3, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.9 | 13.0 |
|
||||
|
||||
### v0.4.17
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.4.17)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------------- | ------- | ---------- |
|
||||
| 2.6.3, 2.8.3 | 3.10, 3.11, 3.12, 3.13 | 2.9 | 12.6, 12.8 |
|
||||
|
||||
### v0.4.16
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.4.16)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ------ | ------------------ | ---------- |
|
||||
| 2.6.3, 2.8.3 | 3.9 | 2.5, 2.6, 2.7, 2.8 | 12.4, 12.6 |
|
||||
|
||||
### v0.4.15
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.4.15)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | ------- | ---------- |
|
||||
| 2.8.3 | 3.11, 3.12, 3.13 | 2.9 | 12.6, 12.8 |
|
||||
|
||||
#### Windows x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | ------- | ---- |
|
||||
| 2.8.3 | 3.11, 3.12, 3.13 | 2.9 | 12.6 |
|
||||
|
||||
### v0.4.12
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.4.12)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ------ | ------------- | ---------------------- |
|
||||
| 2.8.3 | 3.13 | 2.6, 2.7, 2.8 | 12.4, 12.6, 12.8, 12.9 |
|
||||
|
||||
#### Windows x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ------ | ------------- | ---------- |
|
||||
| 2.8.2 | 3.13 | 2.6, 2.7, 2.8 | 12.4, 12.6 |
|
||||
|
||||
### v0.4.11
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.4.11)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | ------------------ | ---------------------- |
|
||||
| 2.8.3 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.8 | 12.4, 12.6, 12.8, 12.9 |
|
||||
|
||||
### v0.4.10
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.4.10)
|
||||
|
||||
#### Windows x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | -------- | ---- |
|
||||
| 2.7.4, 2.8.2 | 3.10, 3.11, 3.12 | 2.7, 2.8 | 12.8 |
|
||||
|
||||
### v0.4.9
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.4.9)
|
||||
|
||||
#### Windows x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ------ | ------- | ---- |
|
||||
| 2.7.4 | 3.11 | 2.7 | 12.8 |
|
||||
|
||||
### v0.3.18
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.3.18)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | ------------------ | ---------------- |
|
||||
| 2.7.4 | 3.10, 3.11, 3.12 | 2.5, 2.6, 2.7, 2.8 | 12.4, 12.8, 12.9 |
|
||||
|
||||
### v0.3.14
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.3.14)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | -------------------------- | ---------------------- |
|
||||
| 2.6.3, 2.8.2 | 3.10, 3.11, 3.12 | 2.5.1, 2.6.0, 2.7.1, 2.8.0 | 12.4.1, 12.8.1, 12.9.1 |
|
||||
|
||||
### v0.3.13
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.3.13)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | -------------------------- | ------ |
|
||||
| 2.8.1 | 3.10, 3.11, 3.12 | 2.4.1, 2.5.1, 2.6.0, 2.7.1 | 12.8.1 |
|
||||
|
||||
### v0.3.12
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.3.12)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | -------------------------- | -------------- |
|
||||
| 2.8.0 | 3.10, 3.11, 3.12 | 2.4.1, 2.5.1, 2.6.0, 2.7.1 | 12.4.1, 12.8.1 |
|
||||
|
||||
### v0.3.10
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.3.10)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | ------- | ------ |
|
||||
| 2.7.4 | 3.10, 3.11, 3.12 | 2.7.1 | 12.8.1 |
|
||||
|
||||
### v0.3.9
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.3.9)
|
||||
|
||||
#### Linux x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| ------------------- | ---------------- | ------- | ------ |
|
||||
| 2.4.3, 2.5.9, 2.6.3 | 3.10, 3.11, 3.12 | 2.7.1 | 12.8.1 |
|
||||
|
||||
#### Windows x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| ------------------- | ---------------- | ------------------- | ------ |
|
||||
| 2.5.9, 2.6.3, 2.7.4 | 3.10, 3.11, 3.12 | 2.4.1, 2.5.1, 2.6.0 | 12.4.1 |
|
||||
|
||||
> [!IMPORTANT]
|
||||
> ⚠️ Building flash-attn v2.7.4 with CUDA 12.8 on Windows cannot be completed because of GitHub Actions’ processing-time limits. In the future, I plan to add a self-hosted Windows runner to resolve this issue.
|
||||
|
||||
### v0.3.1
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.3.1)
|
||||
|
||||
#### Windows x86_64
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ------ | ------- | ------ |
|
||||
| 2.6.3 | 3.11 | 2.6.0 | 12.6.3 |
|
||||
|
||||
Starting with this version, wheels for Windows are released.
|
||||
However, the Windows wheels have not been tested thoroughly yet, so reports on how well they work are welcome.
|
||||
|
||||
### v0.2.1
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.2.1)
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| -------------------------- | ---------------- | ----------------- | ------ |
|
||||
| 2.4.3, 2.5.9, 2.6.3, 2.7.4 | 3.10, 3.11, 3.12 | 2.8.0.dev20250523 | 12.8.1 |
|
||||
|
||||
### v0.2.0
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.2.0)
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| ------------------- | ---------------- | ----------------- | ------ |
|
||||
| 2.4.3, 2.5.9, 2.6.3 | 3.10, 3.11, 3.12 | 2.8.0.dev20250523 | 12.8.1 |
|
||||
|
||||
### v0.1.0
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.1.0)
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| -------------------------- | ---------------- | ------- | ------ |
|
||||
| 2.4.3, 2.5.9, 2.6.3, 2.7.4 | 3.10, 3.11, 3.12 | 2.7.0 | 12.8.1 |
|
||||
|
||||
v2.7.4 and v2.7.4.post1 are the same version.
|
||||
|
||||
Starting with this release, self-hosted runners are used to build some of the wheels.
|
||||
|
||||
### v0.0.9
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.0.9)
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| ------------------- | ---------------- | ------- | ------ |
|
||||
| 2.4.3, 2.5.9, 2.6.3 | 3.10, 3.11, 3.12 | 2.7.0 | 12.8.1 |
|
||||
|
||||
### v0.0.8
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.0.8)
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| -------------------------------- | ---------------- | -------------------------- | ---------------------- |
|
||||
| 2.4.3, 2.5.9, 2.6.3, 2.7.4.post1 | 3.10, 3.11, 3.12 | 2.4.1, 2.5.1, 2.6.0, 2.7.0 | 11.8.0, 12.4.1, 12.6.3 |
|
||||
|
||||
### v0.0.7
|
||||
|
||||
Skipped for experimental reasons.
|
||||
|
||||
### v0.0.6
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.0.6)
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| -------------------------------- | ---------------- | --------------------------------- | -------------- |
|
||||
| 2.4.3, 2.5.9, 2.6.3, 2.7.4.post1 | 3.10, 3.11, 3.12 | 2.2.2, 2.3.1, 2.4.1, 2.5.1, 2.6.0 | 12.4.1, 12.6.3 |
|
||||
|
||||
### v0.0.5
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.0.5)
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| ------------------ | ---------------- | ----------------------------------------------- | -------------- |
|
||||
| 2.6.3, 2.7.4.post1 | 3.10, 3.11, 3.12 | 2.0.1, 2.1.2, 2.2.2, 2.3.1, 2.4.1, 2.5.1, 2.6.0 | 12.4.1, 12.6.3 |
|
||||
|
||||
### v0.0.4
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.0.4)
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | ---------------------------------------- | ---------------------- |
|
||||
| 2.7.3 | 3.10, 3.11, 3.12 | 2.0.1, 2.1.2, 2.2.2, 2.3.1, 2.4.1, 2.5.1 | 11.8.0, 12.1.1, 12.4.1 |
|
||||
|
||||
### v0.0.3
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.0.3)
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| --------------- | ---------------- | ---------------------------------------- | ---------------------- |
|
||||
| 2.7.2.post1 | 3.10, 3.11, 3.12 | 2.0.1, 2.1.2, 2.2.2, 2.3.1, 2.4.1, 2.5.1 | 11.8.0, 12.1.1, 12.4.1 |
|
||||
|
||||
### v0.0.2
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.0.2)
|
||||
|
||||
| Flash-Attention | Python | PyTorch | CUDA |
|
||||
| -------------------------------- | ---------------- | ---------------------------------------- | ---------------------- |
|
||||
| 2.4.3, 2.5.6, 2.6.3, 2.7.0.post2 | 3.10, 3.11, 3.12 | 2.0.1, 2.1.2, 2.2.2, 2.3.1, 2.4.1, 2.5.1 | 11.8.0, 12.1.1, 12.4.1 |
|
||||
|
||||
### v0.0.1
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.0.1)
|
||||
|
||||
| Flash-Attention                   | Python           | PyTorch                                  | CUDA                   |
|
||||
| --------------------------------- | ---------------- | ---------------------------------------- | ---------------------- |
|
||||
| 1.0.9, 2.4.3, 2.5.6, 2.5.9, 2.6.3 | 3.10, 3.11, 3.12 | 2.0.1, 2.1.2, 2.2.2, 2.3.1, 2.4.1, 2.5.0 | 11.8.0, 12.1.1, 12.4.1 |
|
||||
|
||||
### v0.0.0
|
||||
|
||||
[Release](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/tag/v0.0.0)
|
||||
|
||||
| Flash-Attention            | Python     | PyTorch                                  | CUDA                   |
|
||||
| -------------------------- | ---------- | ---------------------------------------- | ---------------------- |
|
||||
| 2.4.3, 2.5.6, 2.5.9, 2.6.3 | 3.11, 3.12 | 2.0.1, 2.1.2, 2.2.2, 2.3.1, 2.4.1, 2.5.0 | 11.8.0, 12.1.1, 12.4.1 |
|
||||
Reference in New Issue
Block a user