Skip to content

Commit a777a86

Browse files
committed
[dl-cifar] Use -O3 -ffast-math in all versions
Only the SYCL version used fast math, and only the SYCL and HIP versions used -O3, whereas the CUDA version used -O2. This created an unfair comparison between the programming models. Align the compilation flags so that every version uses -O3 -ffast-math.
1 parent 890d3f0 commit a777a86

File tree

2 files changed

+3
-3
lines changed

2 files changed

+3
-3
lines changed

dl-cifar/CUDA/CMakeLists.txt

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -34,7 +34,7 @@ option(USE_SM "Specifies which streaming multiprocessor archite
3434
option(DEVICE_TIMER "Build using Device Timer" OFF)
3535

3636
set(DEF_WL_CXX_FLAGS " ")
37-
set(DEF_GENERAL_CXX_FLAGS " -O2 ")
37+
set(DEF_GENERAL_CXX_FLAGS " -O3 -ffast-math ")
3838
set(DEF_COMBINED_CXX_FLAGS "${DEF_GENERAL_CXX_FLAGS} ${DEF_WL_CXX_FLAGS}")
3939

4040
set(SOURCES
@@ -114,4 +114,4 @@ set(CUDA_SEPARABLE_COMPILATION ON)
114114
message(STATUS "CXX Compilation flags to: ${CMAKE_CXX_FLAGS}")
115115
link_libraries(stdc++fs cublas cudnn)
116116
cuda_add_executable(${PROJECT_NAME} ${SOURCES})
117-
target_link_libraries(${PROJECT_NAME} ${CUDA_LIBRARIES})
117+
target_link_libraries(${PROJECT_NAME} ${CUDA_LIBRARIES})

dl-cifar/HIP/CMakeLists.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -33,7 +33,7 @@ option(DEVICE_TIMER "Build using Device Timer" OFF)
3333

3434

3535
set(DEF_WL_CXX_FLAGS " -D__HIP_PLATFORM_AMD__ ")
36-
set(DEF_GENERAL_CXX_FLAGS " -Wall -O3 -Wextra ")
36+
set(DEF_GENERAL_CXX_FLAGS " -Wall -O3 -ffast-math -Wextra ")
3737
set(DEF_COMBINED_CXX_FLAGS "${DEF_GENERAL_CXX_FLAGS} ${DEF_WL_CXX_FLAGS}")
3838

3939

0 commit comments

Comments
 (0)