# CM_dependencies.cmake
# (forked from hank-ai/darknet)
# Darknet object detection framework
# ==========
# == CUDA ==
# ==========
#
# Probe for a CUDA compiler.  When one is available:
#
#	- the CUDA language is enabled and the CUDA toolkit is located
#	- the toolkit include directories are added to the directory-scope include path
#	- the GPU preprocessor symbol is defined
#	- CUDA 17 is requested as the (required) CUDA language standard
#	- DARKNET_CUDA_ARCHITECTURES and DARKNET_USE_CUDA are set
#	- the CUDA runtime, driver, cuBLAS and cuRAND imported targets are appended to DARKNET_LINK_LIBS
#
# When no CUDA compiler is available only a warning is issued and none of the above is set.
#
INCLUDE (CheckLanguage) # provides CHECK_LANGUAGE(); harmless if it was already included
CHECK_LANGUAGE (CUDA)
IF (CMAKE_CUDA_COMPILER)
	MESSAGE (STATUS "CUDA detected. Darknet will use the GPU.")
	ENABLE_LANGUAGE (CUDA)
	# REQUIRED because the CUDA:: imported targets appended to DARKNET_LINK_LIBS below only exist once the
	# toolkit has been located; failing here gives a clear message instead of an unknown-target error later.
	FIND_PACKAGE (CUDAToolkit REQUIRED)
	INCLUDE_DIRECTORIES (${CUDAToolkit_INCLUDE_DIRS})
	ADD_COMPILE_DEFINITIONS (GPU) # TODO rename this to DARKNET_USE_GPU or DARKNET_USE_CUDA?
	SET (CMAKE_CUDA_STANDARD 17)
	SET (CMAKE_CUDA_STANDARD_REQUIRED ON)
	#
	# Best to use "native" as the architecture, as this will use whatever GPU is installed.
	# But if desired, the exact major architecture index can also be specified. For example:
	#
	# (note that some of these are no longer supported in recent versions of CUDA)
	#
	# 20: GeForce 400, 500, 600, GT-630
	# 30: GeForce 700, GT 730, 740, 760, 770
	# 35: Tesla K40
	# 37: Tesla K80
	# 50: Tesla Quadro M
	# 52: Quadro M6000, GeForce 900, 970, 980, Titan X
	# 53: Tegra Jetson TX1, X1, Drive CX, Drive PX, Jetson Nano
	# 60: Quadro GP100, Tesla P100, DGX-1
	# 61: GTX 1080, 1070, 1060, 1050, 1030, 1010, GP108 Titan Xp, Tesla P40, Tesla P4, Drive PX2
	# 62: Drive PX2, Tegra Jetson TX2
	# 70: DGX-1 Volta, Tesla V100, GTX 1180 GV104, Titan V, Quadro VG100
	# 72: Jetson AGX Xavier, AGX Pegasus, Jetson Xavier NX
	# 75: GTX RTX Turing, GTX 1660, RTX 2060, RTX 2070, RTX 2080, Titan RTX, Quadro RTX 4000, 5000, 6000, 8000, T1000, T2000, Tesla T4, XNOR Tensor Cores
	# 80: A100, GA100, DGX-A100, RTX 3080 (?)
	# 86: Tesla GA10x, RTX Ampere, RTX 3050, 3070, 3080, 3090, GA102, GA107, RTX A2000, A3000, A4000, A5000, A6000, A40, GA106, RTX 3060, GA104, A10, A16, A40, A2 Tensor
	# 87: Jetson AGX Orin, Drive AGX Orin
	# 89: RTX 4090, 4080, 6000, Tesla L40
	# 90: H100, GH100
	#
	# SET (DARKNET_CUDA_ARCHITECTURES "86")
	# SET (DARKNET_CUDA_ARCHITECTURES "75;80;86")
	SET (DARKNET_CUDA_ARCHITECTURES "native")
	SET (DARKNET_USE_CUDA ON)
	SET (DARKNET_LINK_LIBS ${DARKNET_LINK_LIBS} CUDA::cudart CUDA::cuda_driver CUDA::cublas CUDA::curand)
ELSE ()
	MESSAGE (WARNING "CUDA not found. Darknet will be CPU-only.")
ENDIF ()
# ===========
# == cuDNN ==
# ===========
#
# Only attempted when DARKNET_USE_CUDA is set.  Searches for cudnn.h and the cudnn library; when both are
# found the CUDNN and CUDNN_HALF preprocessor symbols are defined, the library is appended to
# DARKNET_LINK_LIBS, and the header directory is added to the include path.  Otherwise a warning is issued.
#
# Search results are stored in the "cudnn_include" and "cudnn" variables.
#
IF (DARKNET_USE_CUDA)
	# Look for cudnn, we will look in the same place as other CUDA libraries and also a few other places as well.
	#
	# CUDAToolkit_INCLUDE_DIRS / CUDAToolkit_LIBRARY_DIR are what FIND_PACKAGE(CUDAToolkit) provides.  The
	# CUDA_INCLUDE_DIRS / CUDA_CUBLAS_LIBRARIES variables belong to the legacy FindCUDA module; they are kept
	# as additional hints in case something else has set them, but are normally empty.
	FIND_PATH (cudnn_include cudnn.h
		HINTS ${CUDAToolkit_INCLUDE_DIRS} ${CUDA_INCLUDE_DIRS} ENV CUDNN_INCLUDE_DIR ENV CUDA_PATH ENV CUDNN_HOME
		PATHS /usr/local /usr/local/cuda ENV CPATH
		PATH_SUFFIXES include)
	GET_FILENAME_COMPONENT (cudnn_hint_path "${CUDA_CUBLAS_LIBRARIES}" PATH)
	FIND_LIBRARY (cudnn cudnn
		HINTS ${CUDAToolkit_LIBRARY_DIR} ${cudnn_hint_path} ENV CUDNN_LIBRARY_DIR ENV CUDA_PATH ENV CUDNN_HOME
		PATHS /usr/local /usr/local/cuda ENV LD_LIBRARY_PATH
		PATH_SUFFIXES lib64 lib/x64 lib x64)
	IF (cudnn AND cudnn_include)
		MESSAGE (STATUS "Found cuDNN library: " ${cudnn})
		ADD_COMPILE_DEFINITIONS (CUDNN) # TODO this needs to be renamed
		ADD_COMPILE_DEFINITIONS (CUDNN_HALF)
		SET (DARKNET_LINK_LIBS ${DARKNET_LINK_LIBS} ${cudnn})
		MESSAGE (STATUS "Found cuDNN include: " ${cudnn_include})
		INCLUDE_DIRECTORIES (${cudnn_include})
	ELSE ()
		MESSAGE (WARNING "cuDNN not found.")
	ENDIF ()
ENDIF ()
# ========================
# == Intel/AMD Hardware ==
# ========================
#
# Sets HARDWARE_IS_X86 to TRUE when the host processor name contains "x86" (which also covers
# "x86_32" and "x86_64") or "AMD64", and to FALSE otherwise.  The decision is logged either way.
#
IF (CMAKE_HOST_SYSTEM_PROCESSOR MATCHES "x86|AMD64")
	SET (HARDWARE_IS_X86 TRUE)
ELSE ()
	SET (HARDWARE_IS_X86 FALSE)
ENDIF ()

IF (HARDWARE_IS_X86)
	MESSAGE (STATUS "Hardware is 32-bit or 64-bit, and seems to be Intel or AMD: ${CMAKE_HOST_SYSTEM_PROCESSOR}")
ELSE ()
	MESSAGE (STATUS "Hardware does not appear to be 32-bit or 64-bit, Intel or AMD: ${CMAKE_HOST_SYSTEM_PROCESSOR}")
ENDIF ()
# ===============
# == GCC/Clang ==
# ===============
#
# COMPILER_IS_GNU_OR_CLANG is TRUE when CMAKE_COMPILER_IS_GNUCC is set or the C++ compiler ID
# contains "Clang"; FALSE in every other case.
#
SET (COMPILER_IS_GNU_OR_CLANG FALSE)
IF (CMAKE_COMPILER_IS_GNUCC OR "${CMAKE_CXX_COMPILER_ID}" MATCHES "Clang")
	SET (COMPILER_IS_GNU_OR_CLANG TRUE)
ENDIF ()
# ====================
# == GCC/Clang/MSVC ==
# ====================
#
# COMPILER_IS_GNU_OR_CLANG_OR_MSVC is TRUE when COMPILER_IS_GNU_OR_CLANG is already true or the
# C++ compiler ID contains "MSVC"; FALSE in every other case.
#
SET (COMPILER_IS_GNU_OR_CLANG_OR_MSVC FALSE)
IF (COMPILER_IS_GNU_OR_CLANG OR "${CMAKE_CXX_COMPILER_ID}" MATCHES "MSVC")
	SET (COMPILER_IS_GNU_OR_CLANG_OR_MSVC TRUE)
ENDIF ()
# =============
# == Threads ==
# =============
#
# A threading library is mandatory.  On success the Threads::Threads imported target is appended
# to DARKNET_LINK_LIBS.
#
FIND_PACKAGE (Threads REQUIRED)
# FindThreads does not provide a version variable, so report which threading API was selected instead.
IF (CMAKE_USE_WIN32_THREADS_INIT)
	SET (darknet_threads_api "Win32 threads")
ELSEIF (CMAKE_USE_PTHREADS_INIT)
	SET (darknet_threads_api "pthreads")
ELSE ()
	SET (darknet_threads_api "unknown API")
ENDIF ()
MESSAGE (STATUS "Found Threads (${darknet_threads_api})")
SET (DARKNET_LINK_LIBS ${DARKNET_LINK_LIBS} Threads::Threads)
# ============
# == OpenCV ==
# ============
#
# OpenCV is mandatory and is located through its package configuration file.  Its libraries are
# appended to DARKNET_LINK_LIBS and its headers are added to the directory-scope include path.
#
FIND_PACKAGE (OpenCV CONFIG REQUIRED)
MESSAGE (STATUS "Found OpenCV ${OpenCV_VERSION}")
LIST (APPEND DARKNET_LINK_LIBS ${OpenCV_LIBS})
INCLUDE_DIRECTORIES (${OpenCV_INCLUDE_DIRS})
# ============
# == OpenMP ==
# ============
#
# OpenMP is optional.  When it is found, the OPENMP preprocessor symbol is defined, the OpenMP
# imported targets that exist are appended to DARKNET_LINK_LIBS, and -fopenmp is added for
# GCC/Clang.  When it is not found a warning is issued and nothing else changes.
#
FIND_PACKAGE (OpenMP QUIET) # optional
IF (OpenMP_FOUND)
	MESSAGE (STATUS "Found OpenMP ${OpenMP_VERSION}")
	ADD_COMPILE_DEFINITIONS (OPENMP)
	# An OpenMP::OpenMP_<lang> target is only created for a language that is enabled and for which
	# OpenMP was detected, so check before linking against it.
	FOREACH (darknet_openmp_target IN ITEMS OpenMP::OpenMP_CXX OpenMP::OpenMP_C)
		IF (TARGET ${darknet_openmp_target})
			SET (DARKNET_LINK_LIBS ${DARKNET_LINK_LIBS} ${darknet_openmp_target})
		ENDIF ()
	ENDFOREACH ()
	IF (COMPILER_IS_GNU_OR_CLANG)
		ADD_COMPILE_OPTIONS (-fopenmp)
	ENDIF ()
ELSE ()
	MESSAGE (WARNING "OpenMP not found. Building Darknet without support for OpenMP.")
ENDIF ()
# ===============
# == AVX & SSE ==
# ===============
#
# ENABLE_SSE_AND_AVX defaults to ON, but is only offered when both COMPILER_IS_GNU_OR_CLANG_OR_MSVC
# and HARDWARE_IS_X86 are true; otherwise it is forced to OFF.
#
CMAKE_DEPENDENT_OPTION (
	ENABLE_SSE_AND_AVX
	"Enable AVX and SSE optimizations (Intel and AMD only)"
	ON
	"COMPILER_IS_GNU_OR_CLANG_OR_MSVC;HARDWARE_IS_X86"
	OFF)

IF (ENABLE_SSE_AND_AVX)
	MESSAGE (STATUS "Enabling AVX and SSE optimizations.")
	IF (NOT COMPILER_IS_GNU_OR_CLANG)
		# Neither GCC nor Clang: append the AVX2 switch to the C++ flags.
		STRING (APPEND CMAKE_CXX_FLAGS " /arch:AVX2")
	ELSE ()
		# GCC and Clang take one switch per instruction set.
		ADD_COMPILE_OPTIONS (
			-ffp-contract=fast
			-mavx
			-mavx2
			-msse3
			-msse4.1
			-msse4.2
			-msse4a)
	ENDIF ()
ELSE ()
	MESSAGE (WARNING "AVX and SSE optimizations are disabled.")
ENDIF ()
# ============
# == Timing ==
# ============
#
# ENABLE_TIMING_AND_TRACKING defaults to OFF and has no prerequisite conditions.  Turning it on
# defines DARKNET_TIMING_AND_TRACKING_ENABLED and prints a warning so it is not left on by accident.
#
CMAKE_DEPENDENT_OPTION (
	ENABLE_TIMING_AND_TRACKING
	"Enable Darknet timing and tracking debugging"
	OFF
	""
	OFF)

IF (ENABLE_TIMING_AND_TRACKING)
	ADD_COMPILE_DEFINITIONS (DARKNET_TIMING_AND_TRACKING_ENABLED)
	MESSAGE (WARNING "Darknet timing and tracking debug code is *ENABLED*!")
ENDIF ()