onnxruntime
223 строки · 11.0 Кб
1# Copyright (c) Microsoft Corporation. All rights reserved.
2# Licensed under the MIT License.
# Dumping an engine through the com.microsoft:EPContext node requires the contrib ops,
# so refuse to configure the TensorRT execution provider without them.
if(onnxruntime_DISABLE_CONTRIB_OPS)
  message(FATAL_ERROR "To compile TensorRT execution provider contrib ops have to be enabled to dump an engine using com.microsoft:EPContext node.")
endif()

# Directory-scoped preprocessor definitions (they are not limited to a single target).
add_definitions(-DUSE_TENSORRT=1)
if(onnxruntime_TENSORRT_PLACEHOLDER_BUILDER)
  add_definitions(-DORT_TENSORRT_PLACEHOLDER_BUILDER)
endif()
add_definitions(-DONNX_ML=1 -DONNX_NAMESPACE=onnx)

# Plain variables set up front. TENSORRT_ROOT is used below as the search hint for TensorRT;
# the others are presumably read by the fetched onnx-tensorrt project -- TODO confirm.
set(BUILD_LIBRARY_ONLY 1)
set(CXX_VERSION_DEFINED TRUE)
set(CUDA_INCLUDE_DIRS ${CUDAToolkit_INCLUDE_DIRS})
set(TENSORRT_ROOT ${onnxruntime_TENSORRT_HOME})
set(PROTOBUF_LIBRARY ${PROTOBUF_LIB})

# Keep a copy of the incoming C++ flags; the OSS-parser path further down restores them.
set(OLD_CMAKE_CXX_FLAGS ${CMAKE_CXX_FLAGS})

if(WIN32)
  # Same idea for the CUDA flags, which are only modified on Windows.
  set(OLD_CMAKE_CUDA_FLAGS ${CMAKE_CUDA_FLAGS})
  # MSVC warnings switched off globally for the code compiled from here on.
  string(APPEND CMAKE_CXX_FLAGS " /wd4099 /wd4551 /wd4505 /wd4515 /wd4706 /wd4456 /wd4324 /wd4701 /wd4804 /wd4702 /wd4458 /wd4703")
  # NOTE(review): CMAKE_BUILD_TYPE is empty under multi-config generators, so this
  # branch only triggers when the build type is passed explicitly.
  if(CMAKE_BUILD_TYPE STREQUAL "Debug")
    string(APPEND CMAKE_CXX_FLAGS " /wd4805")
  endif()
  string(APPEND CMAKE_CUDA_FLAGS " -include algorithm")
  # Applied to the provider target itself later in this file.
  set(DISABLED_WARNINGS_FOR_TRT /wd4456)
endif()

if(CMAKE_COMPILER_IS_GNUCC)
  string(APPEND CMAKE_CXX_FLAGS " -Wno-unused-parameter -Wno-missing-field-initializers")
endif()
30
# There is an issue when a "Debug build" TRT EP runs with the "Release build" TRT built-in
# parser on Windows. Until the real fix lands, such configurations are forced onto the
# OSS parser by switching the built-in parser option off.
if(WIN32 AND CMAKE_BUILD_TYPE STREQUAL "Debug")
  message(STATUS "[Note] There is an issue when running \"Debug build\" TRT EP with \"Release build\" TRT built-in parser on Windows. This build will use tensorrt oss parser instead.")
  set(onnxruntime_USE_TENSORRT_BUILTIN_PARSER OFF)
endif()
37
# Locate the TensorRT headers, using TENSORRT_ROOT as a hint.
find_path(TENSORRT_INCLUDE_DIR NvInfer.h
  HINTS ${TENSORRT_ROOT}
  PATH_SUFFIXES include)

# Fail early with an actionable message instead of letting file(READ) choke on a
# "TENSORRT_INCLUDE_DIR-NOTFOUND/NvInferVersion.h" path.
if(NOT TENSORRT_INCLUDE_DIR)
  message(FATAL_ERROR "Can't find NvInfer.h. Please check that onnxruntime_TENSORRT_HOME ('${TENSORRT_ROOT}') points to a TensorRT installation.")
endif()
if(NOT EXISTS "${TENSORRT_INCLUDE_DIR}/NvInferVersion.h")
  message(FATAL_ERROR "Can't find NvInferVersion.h in ${TENSORRT_INCLUDE_DIR}")
endif()

file(READ "${TENSORRT_INCLUDE_DIR}/NvInferVersion.h" NVINFER_VER_CONTENT)

# Extract NV_TENSORRT_MAJOR / _MINOR / _PATCH from the header. Each macro is expected in the
# form "define NV_TENSORRT_<PART> <digits>", with one or more spaces before the number.
# For every part this defines NV_TENSORRT_<PART> (the matched digits) and
# NV_TENSORRT_<PART>_INT (the same value passed through math(EXPR)).
foreach(trt_version_part MAJOR MINOR PATCH)
  string(REGEX MATCH "define NV_TENSORRT_${trt_version_part} * +([0-9]+)" trt_version_match "${NVINFER_VER_CONTENT}")
  # Validate before math(EXPR): an empty expression would abort with a parse error that
  # says nothing about the missing macro.
  if("${trt_version_match}" STREQUAL "")
    message(FATAL_ERROR "Can't find NV_TENSORRT_${trt_version_part} macro in ${TENSORRT_INCLUDE_DIR}/NvInferVersion.h")
  endif()
  set(NV_TENSORRT_${trt_version_part} "${CMAKE_MATCH_1}")
  math(EXPR NV_TENSORRT_${trt_version_part}_INT "${NV_TENSORRT_${trt_version_part}}")
endforeach()
unset(trt_version_match)

message(STATUS "NV_TENSORRT_MAJOR is ${NV_TENSORRT_MAJOR}")
59
# Check TRT version >= 10.0.1.6 (TensorRT 10 GA). Only major.minor.patch is available here,
# so the test is "at least 10.0.1".
if("${NV_TENSORRT_MAJOR_INT}.${NV_TENSORRT_MINOR_INT}.${NV_TENSORRT_PATCH_INT}" VERSION_GREATER_EQUAL "10.0.1")
  set(TRT_GREATER_OR_EQUAL_TRT_10_GA ON)
endif()

# From TensorRT 10 GA onwards the Windows libraries carry the major version as a suffix,
# for example nvinfer_10.dll, nvinfer_plugin_10.dll, nvonnxparser_10.dll ...
if(WIN32 AND TRT_GREATER_OR_EQUAL_TRT_10_GA)
  set(NVINFER_LIB "nvinfer_${NV_TENSORRT_MAJOR}")
  set(NVINFER_PLUGIN_LIB "nvinfer_plugin_${NV_TENSORRT_MAJOR}")
  set(PARSER_LIB "nvonnxparser_${NV_TENSORRT_MAJOR}")
endif()

# Fall back to the unversioned names for anything that has not been set by now.
if(NOT NVINFER_LIB)
  set(NVINFER_LIB "nvinfer")
endif()
if(NOT NVINFER_PLUGIN_LIB)
  set(NVINFER_PLUGIN_LIB "nvinfer_plugin")
endif()
if(NOT PARSER_LIB)
  set(PARSER_LIB "nvonnxparser")
endif()
86
# Search for the core TensorRT libraries, using TENSORRT_ROOT as a hint.
# A miss is only reported as a status message here; configuration continues.
message(STATUS "Looking for ${NVINFER_LIB} and ${NVINFER_PLUGIN_LIB}")

find_library(TENSORRT_LIBRARY_INFER
  NAMES ${NVINFER_LIB}
  HINTS ${TENSORRT_ROOT}
  PATH_SUFFIXES lib lib64 lib/x64)
if(NOT TENSORRT_LIBRARY_INFER)
  message(STATUS "Can't find ${NVINFER_LIB}")
endif()

find_library(TENSORRT_LIBRARY_INFER_PLUGIN
  NAMES ${NVINFER_PLUGIN_LIB}
  HINTS ${TENSORRT_ROOT}
  PATH_SUFFIXES lib lib64 lib/x64)
if(NOT TENSORRT_LIBRARY_INFER_PLUGIN)
  message(STATUS "Can't find ${NVINFER_PLUGIN_LIB}")
endif()
104
# Choose the ONNX parser: either the one found next to the TensorRT libraries (built-in)
# or the nvonnxparser_static target from the fetched onnx-tensorrt project (OSS).
# Both branches define TENSORRT_LIBRARY; only the OSS branch defines onnxparser_link_libs.
if(onnxruntime_USE_TENSORRT_BUILTIN_PARSER)
  message(STATUS "Looking for ${PARSER_LIB}")

  find_library(TENSORRT_LIBRARY_NVONNXPARSER
    NAMES ${PARSER_LIB}
    HINTS ${TENSORRT_ROOT}
    PATH_SUFFIXES lib lib64 lib/x64)
  if(NOT TENSORRT_LIBRARY_NVONNXPARSER)
    message(STATUS "Can't find ${PARSER_LIB}")
  endif()

  set(TENSORRT_LIBRARY
    ${TENSORRT_LIBRARY_INFER}
    ${TENSORRT_LIBRARY_INFER_PLUGIN}
    ${TENSORRT_LIBRARY_NVONNXPARSER})
  message(STATUS "Find TensorRT libs at ${TENSORRT_LIBRARY}")
else()
  # Set before onnx-tensorrt is added; presumably read by that project -- TODO confirm.
  if(TRT_GREATER_OR_EQUAL_TRT_10_GA)
    set(ONNX_USE_LITE_PROTO ON)
  endif()

  FetchContent_Declare(
    onnx_tensorrt
    URL ${DEP_URL_onnx_tensorrt}
    URL_HASH SHA1=${DEP_SHA1_onnx_tensorrt}
  )
  if(NOT CUDA_INCLUDE_DIR)
    set(CUDA_INCLUDE_DIR ${CUDAToolkit_INCLUDE_DIRS}) # onnx-tensorrt repo needs this variable to build
  endif()
  # The onnx_tensorrt repo ships a test program, getSupportedAPITest, that relies on unistd.h
  # and therefore does not support Windows. It has to be kept out of our build, which is what
  # onnxruntime_fetchcontent_makeavailable is for.
  onnxruntime_fetchcontent_makeavailable(onnx_tensorrt)
  include_directories(${onnx_tensorrt_SOURCE_DIR})

  # Go back to the C++ flags saved at the top of this file, then re-apply the one GCC
  # suppression that is still wanted.
  set(CMAKE_CXX_FLAGS ${OLD_CMAKE_CXX_FLAGS})
  if(CMAKE_COMPILER_IS_GNUCC)
    string(APPEND CMAKE_CXX_FLAGS " -Wno-unused-parameter")
  endif()

  if(WIN32)
    # Restore the CUDA flags and drop the temporaries.
    set(CMAKE_CUDA_FLAGS ${OLD_CMAKE_CUDA_FLAGS})
    unset(PROTOBUF_LIBRARY)
    unset(OLD_CMAKE_CXX_FLAGS)
    unset(OLD_CMAKE_CUDA_FLAGS)
    # Adjust the parser targets: ignore linker warning 4199 on ${PARSER_LIB}, and
    # force-include io.h and disable warning C4100 on both parser targets.
    set_target_properties(${PARSER_LIB} PROPERTIES LINK_FLAGS "/ignore:4199")
    foreach(parser_target nvonnxparser_static ${PARSER_LIB})
      target_compile_options(${parser_target} PRIVATE /FIio.h /wd4100)
    endforeach()
  endif()

  # Static libraries are just nvonnxparser_static on all platforms
  set(onnxparser_link_libs nvonnxparser_static)
  set(TENSORRT_LIBRARY
    ${TENSORRT_LIBRARY_INFER}
    ${TENSORRT_LIBRARY_INFER_PLUGIN})
  message(STATUS "Find TensorRT libs at ${TENSORRT_LIBRARY}")
endif()
152
# Make the TensorRT headers visible (directory scope).
include_directories(${TENSORRT_INCLUDE_DIR})

# Historically ${TENSORRT_LIBRARY} was empty when linking nvonnxparser_static, because
# nvonnxparser_static itself linked against the TensorRT libraries inside onnx-tensorrt, see
# https://github.com/onnx/onnx-tensorrt/blob/8af13d1b106f58df1e98945a5e7c851ddb5f0791/CMakeLists.txt#L121
# Starting from TRT 10 GA nvonnxparser_static no longer does that, which is why the code above
# locates ${TENSORRT_LIBRARY_INFER} and ${TENSORRT_LIBRARY_INFER_PLUGIN} itself.
#
# Base link set: the dynamic-loader library plus TensorRT. cuDNN and cuBLAS are put in front
# of it unless this is a CUDA-minimal build.
set(trt_link_libs ${CMAKE_DL_LIBS} ${TENSORRT_LIBRARY})
if(NOT onnxruntime_CUDA_MINIMAL)
  set(trt_link_libs CUDNN::cudnn_all cublas ${trt_link_libs})
endif()
# Collect the provider sources: everything under the tensorrt and shared_library provider
# directories, plus the CUDA stream-handle and CUDA-graph files from the CUDA provider.
# CONFIGURE_DEPENDS asks the build to re-check the glob when it runs.
file(GLOB_RECURSE onnxruntime_providers_tensorrt_cc_srcs CONFIGURE_DEPENDS
  "${ONNXRUNTIME_ROOT}/core/providers/tensorrt/*.h"
  "${ONNXRUNTIME_ROOT}/core/providers/tensorrt/*.cc"
  "${ONNXRUNTIME_ROOT}/core/providers/shared_library/*.h"
  "${ONNXRUNTIME_ROOT}/core/providers/shared_library/*.cc"
  "${ONNXRUNTIME_ROOT}/core/providers/cuda/cuda_stream_handle.h"
  "${ONNXRUNTIME_ROOT}/core/providers/cuda/cuda_stream_handle.cc"
  "${ONNXRUNTIME_ROOT}/core/providers/cuda/cuda_graph.h"
  "${ONNXRUNTIME_ROOT}/core/providers/cuda/cuda_graph.cc"
)

# Mirror the on-disk layout below core/ in IDE source groups.
source_group(
  TREE ${ONNXRUNTIME_ROOT}/core
  FILES ${onnxruntime_providers_tensorrt_cc_srcs})
# Define the TensorRT execution provider as a shared library module.
onnxruntime_add_shared_library_module(onnxruntime_providers_tensorrt ${onnxruntime_providers_tensorrt_cc_srcs})
onnxruntime_add_include_to_target(onnxruntime_providers_tensorrt
  onnxruntime_common
  onnx
  flatbuffers::flatbuffers
  Boost::mp11
  safeint_interface)
add_dependencies(onnxruntime_providers_tensorrt
  onnxruntime_providers_shared
  ${onnxruntime_EXTERNAL_DEPENDENCIES})

# The two parser modes link different sets: the built-in parser path adds Boost::mp11 and
# safeint_interface, the OSS path adds ${onnxparser_link_libs} instead.
if(onnxruntime_USE_TENSORRT_BUILTIN_PARSER)
  target_link_libraries(onnxruntime_providers_tensorrt
    PRIVATE
      ${trt_link_libs}
      ${ONNXRUNTIME_PROVIDERS_SHARED}
      ${PROTOBUF_LIB}
      flatbuffers::flatbuffers
      Boost::mp11
      safeint_interface
      ${ABSEIL_LIBS}
    PUBLIC
      CUDA::cudart)
else()
  target_link_libraries(onnxruntime_providers_tensorrt
    PRIVATE
      ${onnxparser_link_libs}
      ${trt_link_libs}
      ${ONNXRUNTIME_PROVIDERS_SHARED}
      ${PROTOBUF_LIB}
      flatbuffers::flatbuffers
      ${ABSEIL_LIBS}
    PUBLIC
      CUDA::cudart)
endif()

# ${CMAKE_CURRENT_BINARY_DIR} is so that #include "onnxruntime_config.h" inside tensor_shape.h is found
target_include_directories(onnxruntime_providers_tensorrt
  PRIVATE
    ${ONNXRUNTIME_ROOT}
    ${CMAKE_CURRENT_BINARY_DIR}
    ${eigen_INCLUDE_DIRS}
  PUBLIC
    ${CUDAToolkit_INCLUDE_DIRS})

set_target_properties(onnxruntime_providers_tensorrt PROPERTIES
  LINKER_LANGUAGE CUDA
  FOLDER "ONNXRuntime")

target_compile_definitions(onnxruntime_providers_tensorrt PRIVATE ONNXIFI_BUILD_LIBRARY=1)
if(onnxruntime_CUDA_MINIMAL)
  target_compile_definitions(onnxruntime_providers_tensorrt PRIVATE USE_CUDA_MINIMAL=1)
endif()

# DISABLED_WARNINGS_FOR_TRT is only set on Windows, so this adds nothing elsewhere.
target_compile_options(onnxruntime_providers_tensorrt PRIVATE ${DISABLED_WARNINGS_FOR_TRT})
if(WIN32)
  target_compile_options(onnxruntime_providers_tensorrt INTERFACE /wd4456)
endif()
198
# The provider interface pulls in training headers when training is enabled, so the
# training root has to be on the include path in that case.
if(onnxruntime_ENABLE_TRAINING_OPS)
  target_include_directories(onnxruntime_providers_tensorrt
    PRIVATE ${ORTTRAINING_ROOT})
  # With torch interop enabled, the Python::Module target is passed to the same helper.
  if(onnxruntime_ENABLE_TRAINING_TORCH_INTEROP)
    onnxruntime_add_include_to_target(onnxruntime_providers_tensorrt Python::Module)
  endif()
endif()
206
# Restrict the symbols exported by the provider library, using the mechanism of each platform.
# APPEND_STRING concatenates without inserting a separator, so every appended value starts with
# a space; otherwise the new flag would fuse with whatever the property already contains.
if(APPLE)
  # Export list handed to the Apple linker.
  set_property(TARGET onnxruntime_providers_tensorrt APPEND_STRING PROPERTY LINK_FLAGS " -Xlinker -exported_symbols_list ${ONNXRUNTIME_ROOT}/core/providers/tensorrt/exported_symbols.lst")
  target_link_libraries(onnxruntime_providers_tensorrt PRIVATE nsync::nsync_cpp)
elseif(UNIX)
  set_property(TARGET onnxruntime_providers_tensorrt APPEND_STRING PROPERTY COMPILE_FLAGS " -Wno-deprecated-declarations")
  # Version script for symbol visibility, plus garbage collection of unused sections.
  set_property(TARGET onnxruntime_providers_tensorrt APPEND_STRING PROPERTY LINK_FLAGS " -Xlinker --version-script=${ONNXRUNTIME_ROOT}/core/providers/tensorrt/version_script.lds -Xlinker --gc-sections")
  target_link_libraries(onnxruntime_providers_tensorrt PRIVATE nsync::nsync_cpp)
elseif(WIN32)
  # Module-definition file listing the exports.
  set_property(TARGET onnxruntime_providers_tensorrt APPEND_STRING PROPERTY LINK_FLAGS " -DEF:${ONNXRUNTIME_ROOT}/core/providers/tensorrt/symbols.def")
else()
  message(FATAL_ERROR "onnxruntime_providers_tensorrt unknown platform, need to specify shared library exports for it")
endif()
219
# Install the provider: archive and library artifacts go to the library directory,
# runtime artifacts to the binary directory.
install(
  TARGETS onnxruntime_providers_tensorrt
  ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR}
  LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR}
  RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR})
224