3.4.3.5.4 : Le CMakeLists.txt
Écrivons le fichier CMakeLists.txt :

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
remove_definitions(-O3 -O2)
if(USE_TBB)
	set(EXTRA_DEPENDENCIES tensor_alloc data_stream TBB::tbb)
else()
	set(EXTRA_DEPENDENCIES tensor_alloc data_stream)
endif()

set(CONFIG_GPU_HADAMARD "10000,20000,30000,40000,50000,100000,500000,1000000,2000000,5000000,10000000,50000000,100000000")

set(progSrc hadamard.cpp main.cpp)

if(USE_TBB)
	message(STATUS "Activate TBB tests")
	phoenix_compileAndRunExample(perf_hadamard_gpupar_O0 "-O0" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	phoenix_compileAndRunExample(perf_hadamard_gpupar_O1 "-O1" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	phoenix_compileAndRunExample(perf_hadamard_gpupar_O2 "-O2" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	phoenix_compileAndRunExample(perf_hadamard_gpupar_O3 "-O3" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	phoenix_compileAndRunExample(perf_hadamard_gpupar_O4 "-O4" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	set(FLAG_VECTORIZATION "-mavx2 -ftree-vectorize -march=native -mtune=native")
	if(GPU_MODE)
		set(FLAG_VECTORIZATION "-mavx2")
	endif(GPU_MODE)
	phoenix_compileAndRunExample(perf_hadamard_gpupar_vectorize_O3 "-O3 ${FLAG_VECTORIZATION}" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	phoenix_compileAndRunExample(perf_hadamard_gpupar_vectorize_O4 "-O4 ${FLAG_VECTORIZATION}" "${CONFIG_GPU_HADAMARD}" ${progSrc})
endif(USE_TBB)

if(GPU_MODE)
	message(STATUS "Activate GPU NVC++ tests")
	# Minimum capabilities to use stdpar cc60
	set(GPU_EXTRA_FLAGS "-stdpar=gpu -std=c++17")
	set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${GPU_EXTRA_FLAGS}")
# 	set(GPU_EXTRA_FLAGS " -stdpar=gpu -gpu=cc60")
# 	nvc++-Fatal-nvc++-Fatal-The -stdpar option does not currently support compilation for multiple compute capabilities: 60 70 80. The -stdpar option does not currently support compilation for multiple compute capabilities: 60 70 80
# 	set(GPU_EXTRA_FLAGS " -stdpar -gpu=cc50")	#capabilities for the quadro M2200
# 	set(CMAKE_LINK_LIBRARY_FLAG "${CMAKE_LINK_LIBRARY_FLAG} -Mcuda ")

	phoenix_compileAndRunExample(perf_hadamard_gpu_stdpar_par_vectorize_O1 "-O1 ${GPU_EXTRA_FLAGS}" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	
	phoenix_compileAndRunExample(perf_hadamard_gpu_stdpar_par_vectorize_O3 "-O3 ${GPU_EXTRA_FLAGS}" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	phoenix_compileAndRunExample(perf_hadamard_gpu_stdpar_par_vectorize_O4 "-O4 ${GPU_EXTRA_FLAGS}" "${CONFIG_GPU_HADAMARD}" ${progSrc})

	phoenix_plotPerfLogX("hadamard_gpuparParallelGPU"
				perf_hadamard_gpu_stdpar_par_vectorize_O1
				perf_hadamard_gpu_stdpar_par_vectorize_O3	# Compile and works but not for quadro M2200 (too old)
				perf_hadamard_gpu_stdpar_par_vectorize_O4
				)
	if(USE_TBB)
		phoenix_plotPerfLogX("hadamard_gpuparParallelGPUcmp"
				perf_hadamard_gpupar_O3
				perf_hadamard_gpupar_vectorize_O3
				perf_hadamard_gpupar_vectorize_O4
				perf_hadamard_gpu_stdpar_par_vectorize_O3	# Compile and works but not for quadro M2200 (too old)
				perf_hadamard_gpu_stdpar_par_vectorize_O4
				)
		phoenix_plotPerfLogX("hadamard_gpuparBase" perf_hadamard_gpupar_O0 perf_hadamard_gpupar_O1 perf_hadamard_gpupar_O2 perf_hadamard_gpupar_O3 perf_hadamard_gpupar_O4)
		phoenix_plotPerfLogX("hadamard_gpuparVectorize" perf_hadamard_gpupar_O3 perf_hadamard_gpupar_vectorize_O3 perf_hadamard_gpupar_vectorize_O4)
	endif(USE_TBB)
endif(GPU_MODE)


Le fichier CMakeLists.txt complet :

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
remove_definitions(-O3 -O2)
if(USE_TBB)
	set(EXTRA_DEPENDENCIES tensor_alloc data_stream TBB::tbb)
else()
	set(EXTRA_DEPENDENCIES tensor_alloc data_stream)
endif()

set(CONFIG_GPU_HADAMARD "10000,20000,30000,40000,50000,100000,500000,1000000,2000000,5000000,10000000,50000000,100000000")

set(progSrc hadamard.cpp main.cpp)

if(USE_TBB)
	message(STATUS "Activate TBB tests")
	phoenix_compileAndRunExample(perf_hadamard_gpupar_O0 "-O0" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	phoenix_compileAndRunExample(perf_hadamard_gpupar_O1 "-O1" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	phoenix_compileAndRunExample(perf_hadamard_gpupar_O2 "-O2" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	phoenix_compileAndRunExample(perf_hadamard_gpupar_O3 "-O3" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	phoenix_compileAndRunExample(perf_hadamard_gpupar_O4 "-O4" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	set(FLAG_VECTORIZATION "-mavx2 -ftree-vectorize -march=native -mtune=native")
	if(GPU_MODE)
		set(FLAG_VECTORIZATION "-mavx2")
	endif(GPU_MODE)
	phoenix_compileAndRunExample(perf_hadamard_gpupar_vectorize_O3 "-O3 ${FLAG_VECTORIZATION}" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	phoenix_compileAndRunExample(perf_hadamard_gpupar_vectorize_O4 "-O4 ${FLAG_VECTORIZATION}" "${CONFIG_GPU_HADAMARD}" ${progSrc})
endif(USE_TBB)

if(GPU_MODE)
	message(STATUS "Activate GPU NVC++ tests")
	# Minimum capabilities to use stdpar cc60
	set(GPU_EXTRA_FLAGS "-stdpar=gpu -std=c++17")
	set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${GPU_EXTRA_FLAGS}")
# 	set(GPU_EXTRA_FLAGS " -stdpar=gpu -gpu=cc60")
# 	nvc++-Fatal-nvc++-Fatal-The -stdpar option does not currently support compilation for multiple compute capabilities: 60 70 80. The -stdpar option does not currently support compilation for multiple compute capabilities: 60 70 80
# 	set(GPU_EXTRA_FLAGS " -stdpar -gpu=cc50")	#capabilities for the quadro M2200
# 	set(CMAKE_LINK_LIBRARY_FLAG "${CMAKE_LINK_LIBRARY_FLAG} -Mcuda ")

	phoenix_compileAndRunExample(perf_hadamard_gpu_stdpar_par_vectorize_O1 "-O1 ${GPU_EXTRA_FLAGS}" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	
	phoenix_compileAndRunExample(perf_hadamard_gpu_stdpar_par_vectorize_O3 "-O3 ${GPU_EXTRA_FLAGS}" "${CONFIG_GPU_HADAMARD}" ${progSrc})
	phoenix_compileAndRunExample(perf_hadamard_gpu_stdpar_par_vectorize_O4 "-O4 ${GPU_EXTRA_FLAGS}" "${CONFIG_GPU_HADAMARD}" ${progSrc})

	phoenix_plotPerfLogX("hadamard_gpuparParallelGPU"
				perf_hadamard_gpu_stdpar_par_vectorize_O1
				perf_hadamard_gpu_stdpar_par_vectorize_O3	# Compile and works but not for quadro M2200 (too old)
				perf_hadamard_gpu_stdpar_par_vectorize_O4
				)
	if(USE_TBB)
		phoenix_plotPerfLogX("hadamard_gpuparParallelGPUcmp"
				perf_hadamard_gpupar_O3
				perf_hadamard_gpupar_vectorize_O3
				perf_hadamard_gpupar_vectorize_O4
				perf_hadamard_gpu_stdpar_par_vectorize_O3	# Compile and works but not for quadro M2200 (too old)
				perf_hadamard_gpu_stdpar_par_vectorize_O4
				)
		phoenix_plotPerfLogX("hadamard_gpuparBase" perf_hadamard_gpupar_O0 perf_hadamard_gpupar_O1 perf_hadamard_gpupar_O2 perf_hadamard_gpupar_O3 perf_hadamard_gpupar_O4)
		phoenix_plotPerfLogX("hadamard_gpuparVectorize" perf_hadamard_gpupar_O3 perf_hadamard_gpupar_vectorize_O3 perf_hadamard_gpupar_vectorize_O4)
	endif(USE_TBB)
endif(GPU_MODE)


Le fichier CMakeLists.txt est disponible ici.