Skip to content

Commit

Permalink
Switch to cutlass 3.1, disable nvcc --threads
Browse files Browse the repository at this point in the history
  • Loading branch information
tridao committed Aug 14, 2023
1 parent 922fcda commit 5e005c0
Show file tree
Hide file tree
Showing 4 changed files with 9 additions and 5 deletions.
4 changes: 4 additions & 0 deletions .github/workflows/publish.yml
Original file line number Diff line number Diff line change
Expand Up @@ -91,8 +91,12 @@ jobs:
- name: Free up disk space
if: ${{ runner.os == 'Linux' }}
# https://github.com/easimon/maximize-build-space/blob/master/action.yml
# https://github.com/easimon/maximize-build-space/tree/test-report
run: |
sudo rm -rf /usr/share/dotnet
sudo rm -rf /opt/ghc
sudo rm -rf /opt/hostedtoolcache/CodeQL
- name: Install CUDA ${{ matrix.cuda-version }}
if: ${{ matrix.cuda-version != 'cpu' }}
Expand Down
2 changes: 1 addition & 1 deletion csrc/cutlass
Submodule cutlass updated 735 files
2 changes: 1 addition & 1 deletion flash_attn/__init__.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
__version__ = "2.0.6.post3"
__version__ = "2.0.6.post4"

from flash_attn.flash_attn_interface import flash_attn_func
from flash_attn.flash_attn_interface import flash_attn_kvpacked_func
Expand Down
6 changes: 3 additions & 3 deletions setup.py
Original file line number Diff line number Diff line change
Expand Up @@ -91,9 +91,9 @@ def raise_if_cuda_home_none(global_option: str) -> None:


# NOTE(review): this is a diff hunk whose +/- markers and indentation were lost
# in extraction. Per the hunk summary (3 additions & 3 deletions), the three
# uncommented lines right after `def` appear to be the REMOVED version, which
# appended "--threads 4" to the nvcc arguments when the CUDA toolkit version
# was >= 11.2. The commented-out copies and the final `return` appear to be
# what the commit keeps, so the function would hand back nvcc_extra_args
# unchanged (matching the commit title "disable nvcc --threads") -- confirm
# against the actual setup.py before relying on this reading.
def append_nvcc_threads(nvcc_extra_args):
_, bare_metal_version = get_cuda_bare_metal_version(CUDA_HOME)
if bare_metal_version >= Version("11.2"):
return nvcc_extra_args + ["--threads", "4"]
# _, bare_metal_version = get_cuda_bare_metal_version(CUDA_HOME)
# if bare_metal_version >= Version("11.2"):
# return nvcc_extra_args + ["--threads", "4"]
return nvcc_extra_args


Expand Down

0 comments on commit 5e005c0

Please sign in to comment.