lldacing
/

flash-attention-windows-wheel

Model card Files Files and versions Community

lldacing committed on 18 days ago

Commit

29f5d34

•

1 Parent(s): 125c306

Upload 9 files

Browse files

Files changed (10) hide show

.gitattributes +8 -0
WindowsWhlBuilder_cuda.bat +75 -0
flash_attn-2.7.0.post2+cu124torch2.4.0cxx11abiFALSE-cp311-cp311-win_amd64.whl +3 -0
flash_attn-2.7.0.post2+cu124torch2.4.0cxx11abiFALSE-cp312-cp312-win_amd64.whl +3 -0
flash_attn-2.7.0.post2+cu124torch2.4.1cxx11abiFALSE-cp311-cp311-win_amd64.whl +3 -0
flash_attn-2.7.0.post2+cu124torch2.4.1cxx11abiFALSE-cp312-cp312-win_amd64.whl +3 -0
flash_attn-2.7.0.post2+cu124torch2.5.0cxx11abiFALSE-cp311-cp311-win_amd64.whl +3 -0
flash_attn-2.7.0.post2+cu124torch2.5.0cxx11abiFALSE-cp312-cp312-win_amd64.whl +3 -0
flash_attn-2.7.0.post2+cu124torch2.5.1cxx11abiFALSE-cp311-cp311-win_amd64.whl +3 -0
flash_attn-2.7.0.post2+cu124torch2.5.1cxx11abiFALSE-cp312-cp312-win_amd64.whl +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,11 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+flash_attn-2.7.0.post2+cu124torch2.4.0cxx11abiFALSE-cp311-cp311-win_amd64.whl filter=lfs diff=lfs merge=lfs -text
+flash_attn-2.7.0.post2+cu124torch2.4.0cxx11abiFALSE-cp312-cp312-win_amd64.whl filter=lfs diff=lfs merge=lfs -text
+flash_attn-2.7.0.post2+cu124torch2.4.1cxx11abiFALSE-cp311-cp311-win_amd64.whl filter=lfs diff=lfs merge=lfs -text
+flash_attn-2.7.0.post2+cu124torch2.4.1cxx11abiFALSE-cp312-cp312-win_amd64.whl filter=lfs diff=lfs merge=lfs -text
+flash_attn-2.7.0.post2+cu124torch2.5.0cxx11abiFALSE-cp311-cp311-win_amd64.whl filter=lfs diff=lfs merge=lfs -text
+flash_attn-2.7.0.post2+cu124torch2.5.0cxx11abiFALSE-cp312-cp312-win_amd64.whl filter=lfs diff=lfs merge=lfs -text
+flash_attn-2.7.0.post2+cu124torch2.5.1cxx11abiFALSE-cp311-cp311-win_amd64.whl filter=lfs diff=lfs merge=lfs -text
+flash_attn-2.7.0.post2+cu124torch2.5.1cxx11abiFALSE-cp312-cp312-win_amd64.whl filter=lfs diff=lfs merge=lfs -text

WindowsWhlBuilder_cuda.bat ADDED Viewed

	@@ -0,0 +1,75 @@

+@echo off
+rem Runs setup.py bdist_wheel with BUILD_TARGET=cuda, then adds a local version
+rem tag built from the installed torch to every wheel in the dist directory
+rem whose file name does not contain a plus sign yet.
+rem Usage: WindowsWhlBuilder_cuda.bat [WORKERS n] [FORCE_CXX11_ABI value]
+setlocal enabledelayedexpansion
+:parseArgs
+rem Arguments come in NAME VALUE pairs. The quoted form of set is used so that
+rem the blank in front of the command separator is not stored in the value.
+if [%1] == [WORKERS] set "MAX_JOBS=%2" & shift & shift & goto :parseargs
+if [%1] == [FORCE_CXX11_ABI] set "FLASH_ATTENTION_FORCE_CXX11_ABI=%2" & shift & shift & goto :parseargs
+goto :buildContinue
+:end
+:buildFinalize
+rem Clear the variables used by the build, close the setlocal scope and exit.
+set MAX_JOBS=
+set BUILD_TARGET=
+set DISTUTILS_USE_SDK=
+set FLASH_ATTENTION_FORCE_BUILD=
+set FLASH_ATTENTION_FORCE_CXX11_ABI=
+set dist_dir=
+set tmpname=
+endlocal
+goto :eof
+:end
+:buildContinue
+echo MAX_JOBS: %MAX_JOBS%
+echo FLASH_ATTENTION_FORCE_CXX11_ABI: %FLASH_ATTENTION_FORCE_CXX11_ABI%
+rem # We want setuptools >= 49.6.0 otherwise we can't compile the extension if system CUDA version is 11.7 and pytorch cuda version is 11.6
+rem # https://github.com/pytorch/pytorch/blob/664058fa83f1d8eede5d66418abff6e20bd76ca8/torch/utils/cpp_extension.py#L810
+rem # However this still fails so I'm using a newer version of setuptools
+rem pip install setuptools==68.0.0
+pip install "setuptools>=49.6.0" ninja packaging wheel psutil
+rem # Limit MAX_JOBS otherwise the github runner goes OOM
+rem # CUDA 11.8 can compile with 2 jobs, but CUDA 12.3 goes OOM
+set FLASH_ATTENTION_FORCE_BUILD=TRUE
+set BUILD_TARGET=cuda
+set DISTUTILS_USE_SDK=1
+set dist_dir=dist
+python setup.py bdist_wheel --dist-dir=%dist_dir%
+rem rename whl
+rem just major version, such as cu12torch24cxx11abiFALSE
+rem for /f "delims=" %%i in ('python -c "import sys; from packaging.version import parse; import torch; python_version = f'cp{sys.version_info.major}{sys.version_info.minor}'; cxx11_abi=str(torch._C._GLIBCXX_USE_CXX11_ABI).upper(); torch_cuda_version = parse(torch.version.cuda); torch_cuda_version = parse(\"11.8\") if torch_cuda_version.major == 11 else parse(\"12.4\"); cuda_version = f'{torch_cuda_version.major}'; torch_version_raw = parse(torch.__version__); torch_version = f'{torch_version_raw.major}.{torch_version_raw.minor}'; wheel_filename = f'cu{cuda_version}torch{torch_version}cxx11abi{cxx11_abi}'; print(wheel_filename);"') do set wheel_filename=%%i
+rem full versions, such as cu124torch2.4.0cxx11abiFALSE
+rem the CUDA release digits are joined without dots, the torch release with dots
+for /f "delims=" %%i in ('python -c "import sys; from packaging.version import parse; import torch; python_version = f'cp{sys.version_info.major}{sys.version_info.minor}'; cxx11_abi=str(torch._C._GLIBCXX_USE_CXX11_ABI).upper(); torch_cuda_version = parse(torch.version.cuda); cuda_version = \"\".join(map(str, torch_cuda_version.release)); torch_version_raw = parse(torch.__version__); torch_version = \".\".join(map(str, torch_version_raw.release)); wheel_filename = f'cu{cuda_version}torch{torch_version}cxx11abi{cxx11_abi}'; print(wheel_filename);"') do set wheel_filename=%%i
+rem tmpname is expanded when the loop below is parsed, so it is set beforehand
+set tmpname=%wheel_filename%
+for %%i in (%dist_dir%\*.whl) do (
+    set "filename=%%~nxi"
+    rem check if contains +
+    echo !filename! | findstr /c:+ >nul
+    if errorlevel 1 (
+        rem insert +wheel_filename in front of the second '-'
+        rem count equals 2 at exactly one position, so the scan needs no early
+        rem exit; a goto here would also end the enclosing loop over the wheels
+        set "count=0"
+        for /l %%j in (0, 1, 1000) do (
+            if "!filename:~%%j,1!"=="-" set /a count+=1
+            if "!filename:~%%j,1!"=="-" if "!count!"=="2" (
+                set "new_filename=!filename:~0,%%j!+%tmpname%!filename:~%%j!"
+                echo Renaming !filename! to !new_filename!
+                move "%%i" "!dist_dir!/!new_filename!"
+            )
+        )
+    )
+)
+goto :buildFinalize
+:end

flash_attn-2.7.0.post2+cu124torch2.4.0cxx11abiFALSE-cp311-cp311-win_amd64.whl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8cc73333f05fcf553ee322446d02bd343415f0c3fd3ed92a2f4aa15d503e3f54
+size 182257178

flash_attn-2.7.0.post2+cu124torch2.4.0cxx11abiFALSE-cp312-cp312-win_amd64.whl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6c68e07b59cb5440f754074d977e29d7b7f17674a85eea0f8d2b49ab47ba345e
+size 182257119

flash_attn-2.7.0.post2+cu124torch2.4.1cxx11abiFALSE-cp311-cp311-win_amd64.whl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6e3b5a1f800a83c9f2b479186b8f40f6ee8aff4eaac53d2c54913c7375fd10e8
+size 182256553

flash_attn-2.7.0.post2+cu124torch2.4.1cxx11abiFALSE-cp312-cp312-win_amd64.whl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3eed5f4f58a3380dadf2101b80791aa83c8b54b0a78e8462596553601296e050
+size 182257173

flash_attn-2.7.0.post2+cu124torch2.5.0cxx11abiFALSE-cp311-cp311-win_amd64.whl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:676cf819b37db68f48a9fa58ae294062d72fe183e0a0e7f8edabc6e5fadbda5f
+size 182256051

flash_attn-2.7.0.post2+cu124torch2.5.0cxx11abiFALSE-cp312-cp312-win_amd64.whl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0185455c78800164c52999f404717938ff31c58c056ff732eae06b1f4bc795fc
+size 182256077

flash_attn-2.7.0.post2+cu124torch2.5.1cxx11abiFALSE-cp311-cp311-win_amd64.whl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dc0cf06b8a0a3afc2c803f624abf60b5002522c9021834a2d83a627fad401201
+size 182255995

flash_attn-2.7.0.post2+cu124torch2.5.1cxx11abiFALSE-cp312-cp312-win_amd64.whl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:608d2247f1d442c37e67c0507526456714cb19df3c6e0a080ae72131e78b36ba
+size 182256160