From 814e0b4067c6e3d6fe34e0ea0bed02cfee65249a Mon Sep 17 00:00:00 2001
From: Junya Morioka <mjun@mjunya.com>
Date: Thu, 27 Nov 2025 12:06:11 +0900
Subject: [PATCH] chore: Update docs and regenerate packages

---
 README.md          |  4 ++++
 create_matrix.py   | 46 +++++++++++++++++++++++++++-------------------
 create_packages.py |  7 ++++++-
 docs/packages.md   |  6 +++++-
 4 files changed, 42 insertions(+), 21 deletions(-)

diff --git a/README.md b/README.md
index 959e015..febb2ca 100644
--- a/README.md
+++ b/README.md
@@ -42,6 +42,10 @@ pip install ./flash_attn-2.6.3+cu124torch2.5-cp312-cp312-linux_x86_64.whl
 
 ## Packages
 
+> [!NOTE]
+> Since v0.5.0, wheels are built with a local version label indicating the CUDA and PyTorch versions.  
+> Example: `pip list` now reports `flash_attn==2.8.3+cu130torch2.9` instead of `flash_attn==2.8.3`.
+
 See [./docs/packages.md](./docs/packages.md) for the full list of available packages.
 
 ## History
diff --git a/create_matrix.py b/create_matrix.py
index 5bb01cd..034f5d9 100644
--- a/create_matrix.py
+++ b/create_matrix.py
@@ -22,21 +22,20 @@ EXCLUDE = [
 ]
 
 LINUX_MATRIX = {
-    "flash-attn-version": [
-        # "2.6.3", "2.7.4.post1"
-        "2.8.3"
-    ],
-    "python-version": [
-        # "3.10", "3.11", "3.12",
-        "3.13"
-    ],
+    "flash-attn-version": ["2.6.3", "2.7.4", "2.8.3"],
+    "python-version": ["3.10", "3.11", "3.12", "3.13"],
     "torch-version": [
-        # "2.5.1", "2.6.0", "2.7.1", "2.8.0",
+        "2.5.1",
+        "2.6.0",
+        "2.7.1",
+        "2.8.0",
         "2.9.1",
     ],
     "cuda-version": [
-        # "12.4.1", "12.6.3", "12.8.1", "12.9.1",
-        # "12.8.1",
+        "12.4.1",
+        "12.6.3",
+        "12.8.1",
+        "12.9.1",
         "13.0.2",
     ],
 }
@@ -50,20 +49,29 @@ LINUX_SELF_HOSTED_MATRIX = {
 
 WINDOWS_MATRIX = {
     "flash-attn-version": [
-        # "2.7.4.post1",
-        "2.8.3"
+        "2.6.3",
+        "2.7.4",
+        "2.8.3",
     ],
     "python-version": [
-        # "3.10", "3.11", "3.12",
-        "3.13"
+        "3.10",
+        "3.11",
+        "3.12",
+        "3.13",
     ],
     "torch-version": [
-        # "2.5.1", "2.6.0", "2.7.1", "2.8.0",
-        "2.9.1"
+        "2.5.1",
+        "2.6.0",
+        "2.7.1",
+        "2.8.0",
+        "2.9.1",
     ],
     "cuda-version": [
-        # "12.4.1", "12.6.3", "12.8.1", "12.9.1",
-        "13.0.1"
+        "12.4.1",
+        "12.6.3",
+        "12.8.1",
+        "12.9.1",
+        "13.0.2",
     ],
 }
 
diff --git a/create_packages.py b/create_packages.py
index e54fbab..6aca0cd 100644
--- a/create_packages.py
+++ b/create_packages.py
@@ -15,6 +15,11 @@ import pandas as pd
 
 from common import normalize_platform_name, parse_wheel_filename
 
+ADD_NOTE = """> [!NOTE]
+> Since v0.5.0, wheels are built with a local version label indicating the CUDA and PyTorch versions.  
+> Example: `pip list` now reports `flash_attn==2.8.3+cu130torch2.9` instead of `flash_attn==2.8.3`.
+"""
+
 
 def parse_numeric_version(text: str) -> tuple:
     """Extract numeric version tuple for sorting."""
@@ -496,7 +501,7 @@ def main() -> None:
     output_path.parent.mkdir(parents=True, exist_ok=True)
 
     # Generate markdown with "# Packages" header for standalone file
-    standalone_markdown = f"# Packages\n\n{markdown}"
+    standalone_markdown = f"# Packages\n\n{ADD_NOTE}\n{markdown}"
 
     with output_path.open("w", encoding="utf-8") as f:
         f.write(standalone_markdown)
diff --git a/docs/packages.md b/docs/packages.md
index 0bc393d..08b8d56 100644
--- a/docs/packages.md
+++ b/docs/packages.md
@@ -1,5 +1,9 @@
 # Packages
 
+> [!NOTE]
+> Since v0.5.0, wheels are built with a local version label indicating the CUDA and PyTorch versions.  
+> Example: `pip list` now reports `flash_attn==2.8.3+cu130torch2.9` instead of `flash_attn==2.8.3`.
+
 ## Table of Contents
 
 - [Linux x86_64](#linux-x86_64)
@@ -106,7 +110,7 @@
 | 3.13 | 2.8 | 12.9 | [Download1(v0.4.12)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.12/flash_attn-2.8.3%2Bcu129torch2.8-cp313-cp313-linux_x86_64.whl) |
 | 3.13 | 2.9 | 12.6 | [Download1(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.8.3%2Bcu126torch2.9-cp313-cp313-linux_x86_64.whl), [Download2(v0.4.15)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.15/flash_attn-2.8.3%2Bcu126torch2.9-cp313-cp313-linux_x86_64.whl) |
 | 3.13 | 2.9 | 12.8 | [Download1(v0.4.17)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.17/flash_attn-2.8.3%2Bcu128torch2.9-cp313-cp313-linux_x86_64.whl), [Download2(v0.4.15)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.15/flash_attn-2.8.3%2Bcu128torch2.9-cp313-cp313-linux_x86_64.whl) |
-| 3.13 | 2.9 | 13.0 | [Download1(v0.4.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.18/flash_attn-2.8.3%2Bcu130torch2.9-cp313-cp313-linux_x86_64.whl) |
+| 3.13 | 2.9 | 13.0 | [Download1(v0.5.2)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.5.2/flash_attn-2.8.3%2Bcu130torch2.9-cp313-cp313-linux_x86_64.whl), [Download2(v0.4.18)](https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.4.18/flash_attn-2.8.3%2Bcu130torch2.9-cp313-cp313-linux_x86_64.whl) |
 
 </details>