mirror of
https://github.com/BillyOutlast/flash-attention.git
synced 2026-06-30 21:07:55 -04:00
ci: Use 1 ninja job for cu13 (#2195)
Signed-off-by: oliver könig <okoenig@nvidia.com>
This commit is contained in:
@@ -165,7 +165,7 @@ jobs:
|
||||
# Limit MAX_JOBS otherwise the github runner goes OOM
|
||||
# nvcc 11.8 can compile with 2 jobs, but nvcc 12.3 goes OOM; MAX_JOBS is set to 1 for CUDA 12.9 and 13.0, and to 2 otherwise
|
||||
|
||||
export MAX_JOBS=$([ "$MATRIX_CUDA_VERSION" == "129" ] && echo 1 || echo 2)
|
||||
export MAX_JOBS=$([ "$MATRIX_CUDA_VERSION" == "129" ] || [ "$MATRIX_CUDA_VERSION" == "130" ] && echo 1 || echo 2)
|
||||
export NVCC_THREADS=2
|
||||
export FLASH_ATTENTION_FORCE_BUILD="TRUE"
|
||||
export FLASH_ATTENTION_FORCE_CXX11_ABI=${{ inputs.cxx11_abi }}
|
||||
|
||||
Reference in New Issue
Block a user