-
Notifications
You must be signed in to change notification settings - Fork 280
Expand file tree
/
Copy pathCMakeLists.txt
More file actions
351 lines (295 loc) · 14.7 KB
/
CMakeLists.txt
File metadata and controls
351 lines (295 loc) · 14.7 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
# Copyright (c) Microsoft Corporation. All rights reserved.
# Licensed under the MIT License.
if(CMAKE_SYSTEM_NAME STREQUAL "Darwin")
# For xcframework support
cmake_minimum_required(VERSION 3.28)
else()
cmake_minimum_required(VERSION 3.26)
endif()
include(FetchContent)
include(CMakeDependentOption)
project(Generators LANGUAGES C CXX)
# All Options should be defined in cmake/options.cmake This must be included before any other cmake file is included
include(cmake/options.cmake)
if("${CMAKE_C_COMPILER_ID}" STREQUAL "GNU" AND CMAKE_C_COMPILER_VERSION VERSION_LESS 11)
message(FATAL_ERROR "GCC version must be greater than or equal to 11")
endif()
# Avoid warning of Calling FetchContent_Populate(Lib) is deprecated temporarily
# TODO: find a better way to handle the header-only 3rd party deps
if(CMAKE_VERSION VERSION_GREATER_EQUAL "3.30.0")
cmake_policy(SET CMP0169 OLD)
endif()
if(MSVC)
# Add compiler options for security standards
# Note: Must use separate generator expressions — do NOT use "C,CXX" in COMPILE_LANGUAGE.
# Explicitly enable (/GS) stack protection to pass BinSkim checks
add_compile_options("$<$<COMPILE_LANGUAGE:C>:/GS>")
add_compile_options("$<$<COMPILE_LANGUAGE:CXX>:/GS>")
# Enable Control Flow Guard on compiler and linker to pass BinSkim checks
add_compile_options("$<$<COMPILE_LANGUAGE:C>:/guard:cf>")
add_compile_options("$<$<COMPILE_LANGUAGE:CXX>:/guard:cf>")
add_link_options(/guard:cf /DYNAMICBASE)
# Determine the target platform (from MSBuild generator)
if (CMAKE_VS_PLATFORM_NAME)
set(onnxruntime_target_platform ${CMAKE_VS_PLATFORM_NAME})
else()
set(onnxruntime_target_platform ${CMAKE_SYSTEM_PROCESSOR})
endif()
# Enable CET shadow stack unless building for ARM64 (not supported there)
if (onnxruntime_target_platform STREQUAL "x64" OR
onnxruntime_target_platform STREQUAL "Win32" OR
onnxruntime_target_platform STREQUAL "x86")
add_link_options("/CETCOMPAT")
message(STATUS "CET shadow stack enabled (/CETCOMPAT).")
else()
message(STATUS "CET shadow stack skipped.")
endif()
# Enable Spectre mitigations for C and C++ compilations only (avoid CUDA nvcc that is not supported there)
add_compile_options(
"$<$<COMPILE_LANGUAGE:C>:/Qspectre>"
"$<$<COMPILE_LANGUAGE:CXX>:/Qspectre>"
)
# Use updated value for __cplusplus macro (e.g. 201703L for C++17) instead of default 199711L
# Required by some libraries/tools that check __cplusplus for feature support
add_compile_options($<$<COMPILE_LANGUAGE:CXX>:/Zc:__cplusplus>)
add_compile_options(
# Suppress warning C5038: data member will be initialized after another
# Common when member initializer list is written out-of-order vs. declaration
"$<$<COMPILE_LANGUAGE:C>:/w15038>"
"$<$<COMPILE_LANGUAGE:CXX>:/w15038>"
# Suppress warning C4100: unreferenced formal parameter
# Often appears in template or virtual function overrides where a param is unused
"$<$<COMPILE_LANGUAGE:C>:/wd4100>"
"$<$<COMPILE_LANGUAGE:CXX>:/wd4100>"
# Suppress warning C4819: file contains character that cannot be represented in current code page
"$<$<COMPILE_LANGUAGE:C>:/wd4819>"
"$<$<COMPILE_LANGUAGE:CXX>:/wd4819>"
# Suppress warning C4996: use of deprecated function or variable
"$<$<COMPILE_LANGUAGE:C>:/wd4996>"
"$<$<COMPILE_LANGUAGE:CXX>:/wd4996>"
# Enable warning level 4 (more aggressive than default /W3)
# Captures more potential bugs or code smells
"$<$<COMPILE_LANGUAGE:C>:/W4>"
"$<$<COMPILE_LANGUAGE:CXX>:/W4>"
# Treat all warnings as errors (fail build on any warning)
# Combine carefully with /W4 — suppress any known false positives
"$<$<COMPILE_LANGUAGE:C>:/WX>"
"$<$<COMPILE_LANGUAGE:CXX>:/WX>"
)
endif()
include(cmake/ortlib.cmake)
include(cmake/external/onnxruntime_external_deps.cmake)
# All Global variables, including GLOB, for the top level CMakeLists.txt should be defined here
include(cmake/global_variables.cmake)
# Checking if CUDA is supported
include(cmake/check_cuda.cmake)
# Checking if ROCm is supported
include(cmake/check_rocm.cmake)
# Checking if DML is supported
include(cmake/check_dml.cmake)
include(cmake/cxx_standard.cmake)
add_compile_definitions(BUILDING_ORT_GENAI_C)
add_compile_definitions(USE_GUIDANCE=$<BOOL:${USE_GUIDANCE}>)
# Suggested by https://gitlab.kitware.com/cmake/cmake/-/issues/20132
# MacCatalyst is not well supported in CMake
# The error that can emerge without this flag can look like:
# "clang : error : overriding '-mmacosx-version-min=11.0' option with '-target x86_64-apple-ios14.0-macabi' [-Werror,-Woverriding-t-option]"
if (PLATFORM_NAME STREQUAL "macabi")
add_compile_options(-Wno-overriding-t-option)
add_link_options(-Wno-overriding-t-option)
endif()
if(ENABLE_TESTS)
# call enable_testing so we can add tests from subdirectories (e.g. test and src/java)
# it applies recursively to all subdirectories
enable_testing()
if (TEST_PHI2)
add_compile_definitions(TEST_PHI2=1)
else()
add_compile_definitions(TEST_PHI2=0)
endif()
if (TEST_QWEN_2_5)
add_compile_definitions(TEST_QWEN_2_5=1)
else()
add_compile_definitions(TEST_QWEN_2_5=0)
endif()
if (USE_WEBGPU)
add_compile_definitions(USE_WEBGPU=1)
else()
add_compile_definitions(USE_WEBGPU=0)
endif()
endif()
if(ENABLE_TRACING)
message(STATUS "Tracing is enabled.")
add_compile_definitions(ORTGENAI_ENABLE_TRACING)
endif()
find_package(Threads REQUIRED)
if(WIN32)
add_library(onnxruntime-genai SHARED ${generator_srcs} "${GENERATORS_ROOT}/dll/onnxruntime-genai.rc")
target_compile_definitions(onnxruntime-genai PRIVATE VERSION_INFO=\"${VERSION_INFO}\")
target_compile_definitions(onnxruntime-genai PRIVATE VERSION_MAJOR=${VERSION_MAJOR})
target_compile_definitions(onnxruntime-genai PRIVATE VERSION_MINOR=${VERSION_MINOR})
target_compile_definitions(onnxruntime-genai PRIVATE VERSION_PATCH=${VERSION_PATCH})
target_compile_definitions(onnxruntime-genai PRIVATE VERSION_SUFFIX=${VERSION_SUFFIX})
target_compile_definitions(onnxruntime-genai PRIVATE FILE_NAME=\"onnxruntime-genai.dll\")
else()
add_library(onnxruntime-genai SHARED ${generator_srcs})
endif()
target_include_directories(onnxruntime-genai PRIVATE ${ORT_HEADER_DIR})
target_include_directories(onnxruntime-genai PRIVATE ${onnxruntime_extensions_SOURCE_DIR}/shared/api)
target_link_libraries(onnxruntime-genai PRIVATE onnxruntime_extensions)
target_link_directories(onnxruntime-genai PRIVATE ${ORT_LIB_DIR})
target_link_libraries(onnxruntime-genai PRIVATE Threads::Threads)
# The genai library itself is always embedded in the shared library
list(APPEND ortgenai_embed_libs "$<TARGET_FILE:onnxruntime-genai>")
# we keep the shared libraries disconnected on Android as they will come from separate AARs and we don't want to force
# the ORT version to match in both.
if(CMAKE_SYSTEM_NAME STREQUAL "Android" OR CMAKE_SYSTEM_NAME STREQUAL "Linux" OR (CMAKE_SYSTEM_NAME STREQUAL "Darwin" AND (NOT BUILD_APPLE_FRAMEWORK) AND (NOT MAC_CATALYST)))
add_compile_definitions(_ORT_GENAI_USE_DLOPEN)
else()
target_link_libraries(onnxruntime-genai PRIVATE ${ONNXRUNTIME_LIB})
if(USE_WINML)
target_link_options(onnxruntime-genai PRIVATE "/DELAYLOAD:${ONNXRUNTIME_LIB}")
endif()
endif()
if(APPLE)
target_link_libraries(onnxruntime-genai PRIVATE "-framework Foundation" "-framework CoreML")
endif()
# Build all source files using CUDA as a separate shared library we dynamically load at runtime
if((USE_CUDA OR USE_TRT_RTX) AND CMAKE_CUDA_COMPILER)
# Suppress nvcc warnings:
# 1650 = "result of call is not used"
# 221 = "floating-point value does not fit in required floating-point type"
# Also suppress deprecated GPU targets warnings for CUDA 12.8+
add_compile_options(
$<$<COMPILE_LANGUAGE:CUDA>:-diag-suppress=1650>
$<$<COMPILE_LANGUAGE:CUDA>:-diag-suppress=221>
$<$<COMPILE_LANGUAGE:CUDA>:-Wno-deprecated-gpu-targets>
$<$<AND:$<COMPILE_LANGUAGE:CUDA>,$<CXX_COMPILER_ID:MSVC>>:-Xcompiler=/wd4996>
)
if(WIN32)
add_library(onnxruntime-genai-cuda SHARED ${generator_cudalib_srcs} "${GENERATORS_ROOT}/dll/onnxruntime-genai.rc")
target_compile_definitions(onnxruntime-genai-cuda PRIVATE VERSION_INFO=\"${VERSION_INFO}\")
target_compile_definitions(onnxruntime-genai-cuda PRIVATE VERSION_MAJOR=${VERSION_MAJOR})
target_compile_definitions(onnxruntime-genai-cuda PRIVATE VERSION_MINOR=${VERSION_MINOR})
target_compile_definitions(onnxruntime-genai-cuda PRIVATE VERSION_PATCH=${VERSION_PATCH})
target_compile_definitions(onnxruntime-genai-cuda PRIVATE VERSION_SUFFIX=${VERSION_SUFFIX})
target_compile_definitions(onnxruntime-genai-cuda PRIVATE FILE_NAME=\"onnxruntime-genai-cuda.dll\")
else()
add_library(onnxruntime-genai-cuda SHARED ${generator_cudalib_srcs})
endif()
target_include_directories(onnxruntime-genai-cuda PRIVATE ${ORT_HEADER_DIR})
target_include_directories(onnxruntime-genai-cuda PRIVATE ${GENERATORS_ROOT})
target_link_libraries(onnxruntime-genai-cuda PRIVATE cublasLt cublas curand cufft cudart)
set_target_properties(onnxruntime-genai-cuda PROPERTIES LINKER_LANGUAGE CUDA)
add_dependencies(onnxruntime-genai onnxruntime-genai-cuda)
source_group(TREE ${GENERATORS_ROOT}/cuda FILES ${generator_cudalib_srcs})
list(APPEND ortgenai_embed_libs "$<TARGET_FILE:onnxruntime-genai-cuda>")
if(APPLE)
set_property(TARGET onnxruntime-genai-cuda APPEND_STRING PROPERTY LINK_FLAGS "-Xlinker -exported_symbols_list ${GENERATORS_ROOT}/cuda/exported_symbols.lst")
elseif(UNIX)
set_property(TARGET onnxruntime-genai-cuda APPEND_STRING PROPERTY LINK_FLAGS "-Xlinker --version-script=${GENERATORS_ROOT}/cuda/version_script.lds -Xlinker --gc-sections")
elseif(WIN32)
set_property(TARGET onnxruntime-genai-cuda APPEND_STRING PROPERTY LINK_FLAGS "-DEF:${GENERATORS_ROOT}/cuda/symbols.def")
else()
message(FATAL_ERROR "${target} unknown platform, need to specify shared library exports for it")
endif()
endif()
if(USE_GUIDANCE)
target_include_directories(onnxruntime-genai PUBLIC ${llguidance_SOURCE_DIR}/parser/)
target_link_libraries(onnxruntime-genai PRIVATE llguidance)
if (WIN32)
# bcrypt is needed for the rust std lib
target_link_libraries(onnxruntime-genai PRIVATE bcrypt)
endif()
if(MSVC)
# The Rust llguidance static library is always compiled against the release MSVC CRT
# (Rust has no debug CRT concept). The .lib embeds /DEFAULTLIB directives for the release
# CRT and /NODEFAULTLIB directives that suppress the debug CRT (msvcrtd, ucrtd, vcruntimed).
# In Debug builds, C++ code (e.g. onnxruntime-extensions) is compiled with /MDd and references
# debug-only CRT functions like _CrtDbgReport (in ucrtd.lib). Because the Rust .lib suppresses
# ucrtd.lib via its embedded /NODEFAULTLIB, _CrtDbgReport becomes unresolved.
#
# Fix: explicitly add the debug CRT import libraries in Debug builds. Explicitly specified
# libraries are not affected by /NODEFAULTLIB directives (those only suppress /DEFAULTLIB
# auto-linking). Also suppress the conflicting release CRT to avoid LNK4098 warnings.
target_link_libraries(onnxruntime-genai PRIVATE
$<$<CONFIG:Debug>:msvcrtd.lib>
$<$<CONFIG:Debug>:ucrtd.lib>
$<$<CONFIG:Debug>:vcruntimed.lib>
)
target_link_options(onnxruntime-genai PRIVATE
$<$<CONFIG:Debug>:/NODEFAULTLIB:msvcrt.lib>
$<$<CONFIG:Debug>:/NODEFAULTLIB:ucrt.lib>
$<$<CONFIG:Debug>:/NODEFAULTLIB:vcruntime.lib>
$<$<CONFIG:Debug>:/NODEFAULTLIB:libcmt.lib>
$<$<CONFIG:Debug>:/NODEFAULTLIB:libucrt.lib>
$<$<CONFIG:Debug>:/NODEFAULTLIB:libvcruntime.lib>
)
endif()
endif()
if(CMAKE_GENERATOR_TOOLSET MATCHES "Visual Studio")
target_compile_options(onnxruntime-genai PRIVATE "/sdl")
endif()
if(CMAKE_SYSTEM_NAME STREQUAL "Linux")
set_target_properties(onnxruntime-genai PROPERTIES POSITION_INDEPENDENT_CODE ON)
target_link_libraries(onnxruntime-genai PUBLIC dl) # For dlopen & co
endif()
if(USE_DML)
list(APPEND ortgenai_embed_libs "${D3D12_LIB_DIR}/D3D12Core.dll")
target_include_directories(onnxruntime-genai PRIVATE $<TARGET_PROPERTY:${WIL_TARGET},INTERFACE_INCLUDE_DIRECTORIES>)
target_include_directories(onnxruntime-genai PRIVATE $<TARGET_PROPERTY:${DIRECTX_HEADERS_TARGET},INTERFACE_INCLUDE_DIRECTORIES>/directx)
target_include_directories(onnxruntime-genai PRIVATE $<TARGET_PROPERTY:${DIRECTX_HEADERS_TARGET},INTERFACE_INCLUDE_DIRECTORIES>)
target_include_directories(onnxruntime-genai PRIVATE ${DML_HEADER_DIR})
target_include_directories(onnxruntime-genai PRIVATE ${D3D12_HEADER_DIR})
target_link_directories(onnxruntime-genai PRIVATE ${DML_LIB_DIR})
target_link_directories(onnxruntime-genai PRIVATE ${D3D12_LIB_DIR})
target_link_libraries(onnxruntime-genai PRIVATE d3d12.lib dxcore.lib dxguid.lib dxgi.lib)
get_filename_component(PACKAGES_DIR ${CMAKE_CURRENT_BINARY_DIR}/_deps ABSOLUTE)
set(DXC_PACKAGE_DIR ${PACKAGES_DIR}/Microsoft.Direct3D.DXC.1.7.2308.12)
set(NUGET_CONFIG ${PROJECT_SOURCE_DIR}/nuget.config)
set(PACKAGES_CONFIG ${PROJECT_SOURCE_DIR}/packages.config)
add_custom_command(
OUTPUT
${DXC_PACKAGE_DIR}/build/native/bin/x64/dxc.exe
DEPENDS
${PACKAGES_CONFIG}
${NUGET_CONFIG}
COMMAND ${CMAKE_CURRENT_BINARY_DIR}/nuget/src/nuget restore ${PACKAGES_CONFIG} -PackagesDirectory ${PACKAGES_DIR} -ConfigFile ${NUGET_CONFIG}
VERBATIM
)
add_custom_target(
RESTORE_PACKAGES ALL
DEPENDS
${DXC_PACKAGE_DIR}/build/native/bin/x64/dxc.exe
)
add_dependencies(RESTORE_PACKAGES nuget)
add_dependencies(onnxruntime-genai RESTORE_PACKAGES)
endif()
if(ANDROID)
# strip the binary if it's not a build with debug info
set_target_properties(onnxruntime-genai PROPERTIES LINK_FLAGS_RELEASE -s)
set_target_properties(onnxruntime-genai PROPERTIES LINK_FLAGS_MINSIZEREL -s)
# Build shared libraries with support for 16 KB page size on Android
# https://source.android.com/docs/core/architecture/16kb-page-size/16kb#build-lib-16kb-alignment
set(CMAKE_SHARED_LINKER_FLAGS "${CMAKE_SHARED_LINKER_FLAGS} -Wl,-z,max-page-size=16384")
set(CMAKE_MODULE_LINKER_FLAGS "${CMAKE_MODULE_LINKER_FLAGS} -Wl,-z,max-page-size=16384")
endif()
if(ENABLE_TESTS)
message("------------------Enabling tests------------------")
add_subdirectory("${REPO_ROOT}/test")
endif()
if(ENABLE_PYTHON)
message("------------------Enabling Python Wheel------------------")
add_subdirectory("${SRC_ROOT}/python")
endif()
if (ENABLE_JAVA)
message("------------------Enabling Java Jar------------------")
add_subdirectory("${SRC_ROOT}/java")
endif()
if(ENABLE_MODEL_BENCHMARK)
message("------------------Enabling model benchmark------------------")
add_subdirectory("${REPO_ROOT}/benchmark/c")
endif()
# Have visual studio put all files into one single folder vs the default split of header files into a separate folder
source_group(TREE ${GENERATORS_ROOT} FILES ${generator_srcs})
include(cmake/package.cmake)