We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4afe687 commit b639327Copy full SHA for b639327
CMakeLists.txt
@@ -171,16 +171,6 @@ if(NVCC_THREADS AND VLLM_GPU_LANG STREQUAL "CUDA")
171
list(APPEND VLLM_GPU_FLAGS "--threads=${NVCC_THREADS}")
172
endif()
173
174
-#
175
-# Set nvcc fatbin compression.
176
177
-if(VLLM_GPU_LANG STREQUAL "CUDA")
178
- if(${CMAKE_CUDA_COMPILER_VERSION} VERSION_GREATER_EQUAL 12.8)
179
- list(APPEND VLLM_GPU_FLAGS "-Xfatbin" "-compress-all" "-compress-mode=size")
180
- endif()
181
-endif()
182
-
183
184
#
185
# Use FetchContent for C++ dependencies that are compiled as part of vLLM's build process.
186
# setup.py will override FETCHCONTENT_BASE_DIR to play nicely with sccache.
0 commit comments