3.4.3.5.4 : Le CMakeLists.txt
Écrivons le fichier CMakeLists.txt :
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 |
remove_definitions(-O3 -O2) if(USE_TBB) set(EXTRA_DEPENDENCIES tensor_alloc data_stream TBB::tbb) else() set(EXTRA_DEPENDENCIES tensor_alloc data_stream) endif() set(CONFIG_GPU_HADAMARD "10000,20000,30000,40000,50000,100000,500000,1000000,2000000,5000000,10000000,50000000,100000000") set(progSrc hadamard.cpp main.cpp) if(USE_TBB) message(STATUS "Activate TBB tests") phoenix_compileAndRunExample(perf_hadamard_gpupar_O0 "-O0" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_compileAndRunExample(perf_hadamard_gpupar_O1 "-O1" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_compileAndRunExample(perf_hadamard_gpupar_O2 "-O2" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_compileAndRunExample(perf_hadamard_gpupar_O3 "-O3" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_compileAndRunExample(perf_hadamard_gpupar_O4 "-O4" "${CONFIG_GPU_HADAMARD}" ${progSrc}) set(FLAG_VECTORIZATION "-mavx2 -ftree-vectorize -march=native -mtune=native") if(GPU_MODE) set(FLAG_VECTORIZATION "-mavx2") endif(GPU_MODE) phoenix_compileAndRunExample(perf_hadamard_gpupar_vectorize_O3 "-O3 ${FLAG_VECTORIZATION}" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_compileAndRunExample(perf_hadamard_gpupar_vectorize_O4 "-O4 ${FLAG_VECTORIZATION}" "${CONFIG_GPU_HADAMARD}" ${progSrc}) endif(USE_TBB) if(GPU_MODE) message(STATUS "Activate GPU NVC++ tests") # Minimum capabilities to use stdpar cc60 set(GPU_EXTRA_FLAGS "-stdpar=gpu -std=c++17") set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${GPU_EXTRA_FLAGS}") # set(GPU_EXTRA_FLAGS " -stdpar=gpu -gpu=cc60") # nvc++-Fatal-nvc++-Fatal-The -stdpar option does not currently support compilation for multiple compute capabilities: 60 70 80. The -stdpar option does not currently support compilation for multiple compute capabilities: 60 70 80 # set(GPU_EXTRA_FLAGS " -stdpar -gpu=cc50") #capabilities for the quadro M2200 # set(CMAKE_LINK_LIBRARY_FLAG "${CMAKE_LINK_LIBRARY_FLAG} -Mcuda ") phoenix_compileAndRunExample(perf_hadamard_gpu_stdpar_par_vectorize_O1 "-O1 ${GPU_EXTRA_FLAGS}" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_compileAndRunExample(perf_hadamard_gpu_stdpar_par_vectorize_O3 "-O3 ${GPU_EXTRA_FLAGS}" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_compileAndRunExample(perf_hadamard_gpu_stdpar_par_vectorize_O4 "-O4 ${GPU_EXTRA_FLAGS}" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_plotPerfLogX("hadamard_gpuparParallelGPU" perf_hadamard_gpu_stdpar_par_vectorize_O1 perf_hadamard_gpu_stdpar_par_vectorize_O3 # Compile and works but not for quadro M2200 (too old) perf_hadamard_gpu_stdpar_par_vectorize_O4 ) if(USE_TBB) phoenix_plotPerfLogX("hadamard_gpuparParallelGPUcmp" perf_hadamard_gpupar_O3 perf_hadamard_gpupar_vectorize_O3 perf_hadamard_gpupar_vectorize_O4 perf_hadamard_gpu_stdpar_par_vectorize_O3 # Compile and works but not for quadro M2200 (too old) perf_hadamard_gpu_stdpar_par_vectorize_O4 ) phoenix_plotPerfLogX("hadamard_gpuparBase" perf_hadamard_gpupar_O0 perf_hadamard_gpupar_O1 perf_hadamard_gpupar_O2 perf_hadamard_gpupar_O3 perf_hadamard_gpupar_O4) phoenix_plotPerfLogX("hadamard_gpuparVectorize" perf_hadamard_gpupar_O3 perf_hadamard_gpupar_vectorize_O3 perf_hadamard_gpupar_vectorize_O4) endif(USE_TBB) endif(GPU_MODE) |
Le fichier CMakeLists.txt complet :
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 |
remove_definitions(-O3 -O2) if(USE_TBB) set(EXTRA_DEPENDENCIES tensor_alloc data_stream TBB::tbb) else() set(EXTRA_DEPENDENCIES tensor_alloc data_stream) endif() set(CONFIG_GPU_HADAMARD "10000,20000,30000,40000,50000,100000,500000,1000000,2000000,5000000,10000000,50000000,100000000") set(progSrc hadamard.cpp main.cpp) if(USE_TBB) message(STATUS "Activate TBB tests") phoenix_compileAndRunExample(perf_hadamard_gpupar_O0 "-O0" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_compileAndRunExample(perf_hadamard_gpupar_O1 "-O1" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_compileAndRunExample(perf_hadamard_gpupar_O2 "-O2" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_compileAndRunExample(perf_hadamard_gpupar_O3 "-O3" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_compileAndRunExample(perf_hadamard_gpupar_O4 "-O4" "${CONFIG_GPU_HADAMARD}" ${progSrc}) set(FLAG_VECTORIZATION "-mavx2 -ftree-vectorize -march=native -mtune=native") if(GPU_MODE) set(FLAG_VECTORIZATION "-mavx2") endif(GPU_MODE) phoenix_compileAndRunExample(perf_hadamard_gpupar_vectorize_O3 "-O3 ${FLAG_VECTORIZATION}" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_compileAndRunExample(perf_hadamard_gpupar_vectorize_O4 "-O4 ${FLAG_VECTORIZATION}" "${CONFIG_GPU_HADAMARD}" ${progSrc}) endif(USE_TBB) if(GPU_MODE) message(STATUS "Activate GPU NVC++ tests") # Minimum capabilities to use stdpar cc60 set(GPU_EXTRA_FLAGS "-stdpar=gpu -std=c++17") set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${GPU_EXTRA_FLAGS}") # set(GPU_EXTRA_FLAGS " -stdpar=gpu -gpu=cc60") # nvc++-Fatal-nvc++-Fatal-The -stdpar option does not currently support compilation for multiple compute capabilities: 60 70 80. The -stdpar option does not currently support compilation for multiple compute capabilities: 60 70 80 # set(GPU_EXTRA_FLAGS " -stdpar -gpu=cc50") #capabilities for the quadro M2200 # set(CMAKE_LINK_LIBRARY_FLAG "${CMAKE_LINK_LIBRARY_FLAG} -Mcuda ") phoenix_compileAndRunExample(perf_hadamard_gpu_stdpar_par_vectorize_O1 "-O1 ${GPU_EXTRA_FLAGS}" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_compileAndRunExample(perf_hadamard_gpu_stdpar_par_vectorize_O3 "-O3 ${GPU_EXTRA_FLAGS}" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_compileAndRunExample(perf_hadamard_gpu_stdpar_par_vectorize_O4 "-O4 ${GPU_EXTRA_FLAGS}" "${CONFIG_GPU_HADAMARD}" ${progSrc}) phoenix_plotPerfLogX("hadamard_gpuparParallelGPU" perf_hadamard_gpu_stdpar_par_vectorize_O1 perf_hadamard_gpu_stdpar_par_vectorize_O3 # Compile and works but not for quadro M2200 (too old) perf_hadamard_gpu_stdpar_par_vectorize_O4 ) if(USE_TBB) phoenix_plotPerfLogX("hadamard_gpuparParallelGPUcmp" perf_hadamard_gpupar_O3 perf_hadamard_gpupar_vectorize_O3 perf_hadamard_gpupar_vectorize_O4 perf_hadamard_gpu_stdpar_par_vectorize_O3 # Compile and works but not for quadro M2200 (too old) perf_hadamard_gpu_stdpar_par_vectorize_O4 ) phoenix_plotPerfLogX("hadamard_gpuparBase" perf_hadamard_gpupar_O0 perf_hadamard_gpupar_O1 perf_hadamard_gpupar_O2 perf_hadamard_gpupar_O3 perf_hadamard_gpupar_O4) phoenix_plotPerfLogX("hadamard_gpuparVectorize" perf_hadamard_gpupar_O3 perf_hadamard_gpupar_vectorize_O3 perf_hadamard_gpupar_vectorize_O4) endif(USE_TBB) endif(GPU_MODE) |
Le fichier CMakeLists.txt est disponible ici.