Skip to content

Commit b639327

Browse files
authored
Revert "Use NVCC --compress-mode to reduce binary size by 30% #20694" (#20853)
Signed-off-by: mgoin <mgoin64@gmail.com>
1 parent 4afe687 commit b639327

File tree

1 file changed

+0
-10
lines changed

1 file changed

+0
-10
lines changed

CMakeLists.txt

Lines changed: 0 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -171,16 +171,6 @@ if(NVCC_THREADS AND VLLM_GPU_LANG STREQUAL "CUDA")
   list(APPEND VLLM_GPU_FLAGS "--threads=${NVCC_THREADS}")
 endif()
 
-#
-# Set nvcc fatbin compression.
-#
-if(VLLM_GPU_LANG STREQUAL "CUDA")
-  if(${CMAKE_CUDA_COMPILER_VERSION} VERSION_GREATER_EQUAL 12.8)
-    list(APPEND VLLM_GPU_FLAGS "-Xfatbin" "-compress-all" "-compress-mode=size")
-  endif()
-endif()
-
-
 #
 # Use FetchContent for C++ dependencies that are compiled as part of vLLM's build process.
 # setup.py will override FETCHCONTENT_BASE_DIR to play nicely with sccache.

0 commit comments

Comments
 (0)