@@ -751,93 +751,29 @@ target_link_libraries(
751751)
# Compile matrix_multiplication with the OpenMP compiler flags. The expansion is
# quoted so that an empty OpenMP_CXX_FLAGS still produces a well-formed
# property/value pair instead of a malformed set_target_properties() call.
set_target_properties(matrix_multiplication PROPERTIES COMPILE_FLAGS "${OpenMP_CXX_FLAGS}")
753753
754- ## benchmark 6: Parallel DNN
755- #message(STATUS "benchmark 6: Parallel DNN")
756- #set(CMAKE_RUNTIME_OUTPUT_DIRECTORY ${TF_BENCHMARK_DIR}/parallel_dnn)
757- #add_executable(
758- # parallel_dnn
759- # ${TF_BENCHMARK_DIR}/parallel_dnn/main.cpp
760- # ${TF_BENCHMARK_DIR}/parallel_dnn/omp.cpp
761- # ${TF_BENCHMARK_DIR}/parallel_dnn/tbb.cpp
762- # ${TF_BENCHMARK_DIR}/parallel_dnn/seq.cpp
763- # ${TF_BENCHMARK_DIR}/parallel_dnn/taskflow.cpp
764- #)
765- #target_include_directories(parallel_dnn PRIVATE ${PROJECT_SOURCE_DIR}/3rd-party/CLI11)
766- #target_link_libraries(
767- # parallel_dnn
768- # ${PROJECT_NAME}
769- # Threads::Threads
770- # ${TBB_IMPORTED_TARGETS}
771- # ${OpenMP_CXX_LIBRARIES}
772- # stdc++fs
773- # tf::default_settings
774- #)
775- #set_target_properties(parallel_dnn PROPERTIES COMPILE_FLAGS ${OpenMP_CXX_FLAGS})
776- #
777754
778-
779- ### benchmark 8: Mandelbrot set
780- #message(STATUS "benchmark 8: Mandelbrot set")
781- #set(CMAKE_RUNTIME_OUTPUT_DIRECTORY ${TF_BENCHMARK_DIR}/mandelbrot_set)
782- #add_executable(
783- # mandelbrot_set
784- # ${TF_BENCHMARK_DIR}/mandelbrot_set/main.cpp
785- # ${TF_BENCHMARK_DIR}/mandelbrot_set/omp.cpp
786- # ${TF_BENCHMARK_DIR}/mandelbrot_set/tbb.cpp
787- # ${TF_BENCHMARK_DIR}/mandelbrot_set/taskflow.cpp
788- #)
789- #target_include_directories(mandelbrot_set PRIVATE ${PROJECT_SOURCE_DIR}/3rd-party/CLI11)
790- #target_link_libraries(
791- # mandelbrot_set
792- # ${PROJECT_NAME}
793- # Threads::Threads
794- # ${TBB_IMPORTED_TARGETS}
795- # ${OpenMP_CXX_LIBRARIES}
796- # tf::default_settings
797- #)
798- #set_target_properties(mandelbrot_set PROPERTIES COMPILE_FLAGS ${OpenMP_CXX_FLAGS})
799- #
800- ### benchmark 9: Black–Scholes
801- #message(STATUS "benchmark 9: Black-Scholes Partial Differential Equation")
802- #set(CMAKE_RUNTIME_OUTPUT_DIRECTORY ${TF_BENCHMARK_DIR}/black_scholes)
803- #add_executable(
804- # black_scholes
805- # ${TF_BENCHMARK_DIR}/black_scholes/main.cpp
806- # ${TF_BENCHMARK_DIR}/black_scholes/omp.cpp
807- # ${TF_BENCHMARK_DIR}/black_scholes/tbb.cpp
808- # ${TF_BENCHMARK_DIR}/black_scholes/taskflow.cpp
809- #)
810- #target_include_directories(black_scholes PRIVATE ${PROJECT_SOURCE_DIR}/3rd-party/CLI11)
811- #target_link_libraries(
812- # black_scholes
813- # ${PROJECT_NAME}
814- # Threads::Threads
815- # ${TBB_IMPORTED_TARGETS}
816- # ${OpenMP_CXX_LIBRARIES}
817- # tf::default_settings
818- #)
819- #set_target_properties(black_scholes PROPERTIES COMPILE_FLAGS ${OpenMP_CXX_FLAGS})
820- #
821- ### benchmark 10: Strassen algorithm
822- #message(STATUS "benchmark 10: Strassen matrix multiplication algorithm")
823- #set(CMAKE_RUNTIME_OUTPUT_DIRECTORY ${TF_BENCHMARK_DIR}/strassen)
824- #add_executable(
825- # strassen
826- # ${TF_BENCHMARK_DIR}/strassen/main.cpp
827- # ${TF_BENCHMARK_DIR}/strassen/omp.cpp
828- # ${TF_BENCHMARK_DIR}/strassen/tbb.cpp
829- # ${TF_BENCHMARK_DIR}/strassen/taskflow.cpp
830- #)
831- #target_include_directories(strassen PRIVATE ${PROJECT_SOURCE_DIR}/3rd-party/CLI11)
832- #target_link_libraries(
833- # strassen
834- # ${PROJECT_NAME}
835- # Threads::Threads
836- # ${TBB_IMPORTED_TARGETS}
837- # ${OpenMP_CXX_LIBRARIES}
838- # tf::default_settings
839- #)
840- #set_target_properties(strassen PROPERTIES COMPILE_FLAGS ${OpenMP_CXX_FLAGS})
# CUDA benchmarks: only configured when TF_ENABLE_CUDA evaluates to true.
# The variable is passed by name so that if() performs the single dereference
# itself, rather than expanding it first and re-interpreting the result.
if(TF_ENABLE_CUDA)
  ## cuda benchmark 1: heterogeneous traversal
  message(STATUS "cuda benchmark 1: heterogeneous traversal")

  # Place the benchmark binary next to its sources.
  set(CMAKE_RUNTIME_OUTPUT_DIRECTORY ${TF_BENCHMARK_DIR}/hetero_traversal)

  # One executable containing the driver plus the Taskflow, TBB and OpenMP
  # variants of the benchmark.
  add_executable(
    hetero_traversal
    ${TF_BENCHMARK_DIR}/hetero_traversal/main.cu
    ${TF_BENCHMARK_DIR}/hetero_traversal/taskflow.cu
    ${TF_BENCHMARK_DIR}/hetero_traversal/tbb.cu
    ${TF_BENCHMARK_DIR}/hetero_traversal/omp.cu
  )

  # CLI11 headers are only needed to build this target.
  target_include_directories(hetero_traversal PRIVATE ${PROJECT_SOURCE_DIR}/3rd-party/CLI11)

  target_link_libraries(
    hetero_traversal
    ${PROJECT_NAME}
    Threads::Threads
    ${TBB_IMPORTED_TARGETS}
    ${OpenMP_CXX_LIBRARIES}
    tf::default_settings
  )

  # The sources are .cu files, so the OpenMP flag is handed to the host
  # compiler through -Xcompiler.
  # NOTE(review): if OpenMP_CXX_FLAGS ever holds more than one flag, only the
  # first one follows -Xcompiler here -- confirm against the supported toolchains.
  set_target_properties(hetero_traversal PROPERTIES COMPILE_FLAGS "-Xcompiler ${OpenMP_CXX_FLAGS}")
endif()
841777
842778endif ()
843779
0 commit comments