Skip to content

Commit beb1a92

Browse files
amarin16edgchen1yf711ankitm3kn1harika
authored
Cherry-picks into rel-1.21.0 (#23846)
Cherry-pick the following changes into [rel-1.21.0](https://github.com/microsoft/onnxruntime/tree/rel-1.21.0). - (#23791) - (#23710) - (#23789) - (#23829) --------- Co-authored-by: Edward Chen <[email protected]> Co-authored-by: Yifan Li <[email protected]> Co-authored-by: Ankit Maheshkar <[email protected]> Co-authored-by: n1harika <[email protected]> Co-authored-by: Changming Sun <[email protected]>
1 parent 98511b0 commit beb1a92

File tree

11 files changed

+156
-59
lines changed

11 files changed

+156
-59
lines changed

cmake/deps.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -37,7 +37,7 @@ mimalloc;https://github.com/microsoft/mimalloc/archive/refs/tags/v2.1.1.zip;d5ee
3737
mp11;https://github.com/boostorg/mp11/archive/refs/tags/boost-1.82.0.zip;9bc9e01dffb64d9e0773b2e44d2f22c51aace063
3838
onnx;https://github.com/onnx/onnx/archive/refs/tags/v1.17.0.zip;13a60ac5217c104139ce0fd024f48628e7bcf5bc
3939
# Use the latest commit of 10.8-GA
40-
onnx_tensorrt;https://github.com/onnx/onnx-tensorrt/archive/118ed0aea197fa9a7d3ea66180a1d5ddb9deecc3.zip;b78aed3728ad4daf6dc47ea10c1d243dee1d95b1
40+
onnx_tensorrt;https://github.com/onnx/onnx-tensorrt/archive/c5ca8912f30e9ad630a0ef565e3d5f4bd5e91563.zip;588b294aaa9e84679ed5815cea1d399210ac98c2
4141
protobuf;https://github.com/protocolbuffers/protobuf/archive/refs/tags/v21.12.zip;7cf2733949036c7d52fda017badcab093fe73bfa
4242
protoc_win64;https://github.com/protocolbuffers/protobuf/releases/download/v21.12/protoc-21.12-win64.zip;b4521f7ada5b260380f94c4bd7f1b7684c76969a
4343
protoc_win32;https://github.com/protocolbuffers/protobuf/releases/download/v21.12/protoc-21.12-win32.zip;3688010318192c46ce73213cdfb6b3e5656da874

cmake/external/onnxruntime_external_deps.cmake

+1
Original file line numberDiff line numberDiff line change
@@ -301,6 +301,7 @@ if(NOT TARGET Boost::mp11)
301301
onnxruntime_fetchcontent_declare(
302302
mp11
303303
URL ${DEP_URL_mp11}
304+
EXCLUDE_FROM_ALL
304305
FIND_PACKAGE_ARGS NAMES Boost
305306
)
306307
onnxruntime_fetchcontent_makeavailable(mp11)

onnxruntime/core/providers/openvino/ov_versions/data_ops.cc

+4
Original file line numberDiff line numberDiff line change
@@ -121,6 +121,7 @@ std::vector<SupportedOp> supported_op_mode = {
121121
{"DepthToSpace", V_2020_4, {"CPU", "GPU"}},
122122
{"DequantizeLinear", V_2021_4, {"CPU", "GPU"}},
123123
{"DequantizeLinear", V_2024_4, {"NPU"}},
124+
{"DynamicQuantizeMatMul", V_2025_0, {"CPU", "GPU"}},
124125
{"Div", V_2020_4, {"CPU", "GPU"}},
125126
{"Dropout", V_2020_4, {"CPU", "GPU"}},
126127
{"Elu", V_2020_4, {"CPU", "GPU"}},
@@ -136,6 +137,7 @@ std::vector<SupportedOp> supported_op_mode = {
136137
{"Floor", V_2020_4, {"CPU", "GPU"}},
137138
{"FusedConv", V_2023_0, {"CPU", "GPU"}},
138139
{"FusedGemm", V_2023_0, {"CPU", "GPU"}},
140+
{"FusedMatMul", V_2025_0, {"CPU", "GPU"}},
139141
{"Gather", V_2020_4, {"CPU", "GPU"}},
140142
{"GatherElements", V_2022_2, {"CPU", "GPU"}},
141143
{"GatherND", V_2021_4, {"CPU", "GPU"}},
@@ -190,6 +192,7 @@ std::vector<SupportedOp> supported_op_mode = {
190192
{"PRelu", V_2020_4, {"CPU", "GPU"}},
191193
{"QLinearMatMul", V_2022_3, {"CPU"}},
192194
{"QuantizeLinear", V_2021_4, {"CPU", "GPU"}},
195+
{"QuickGelu", V_2025_0, {"CPU", "GPU"}},
193196
{"RNN", V_2023_1, {"CPU", "GPU"}},
194197
{"RandomNormalLike", V_2023_0, {"CPU", "GPU"}},
195198
{"RandomNormalLike", V_2023_0, {"CPU", "GPU"}},
@@ -229,6 +232,7 @@ std::vector<SupportedOp> supported_op_mode = {
229232
{"Sinh", V_2020_4, {"CPU"}},
230233
{"Size", V_2022_1, {"CPU", "GPU"}},
231234
{"SkipLayerNormalization", V_2024_5, {"CPU", "GPU"}},
235+
{"SkipSimplifiedLayerNormalization", V_2025_0, {"CPU", "GPU"}},
232236
{"Slice", V_2020_4, {"CPU", "GPU"}},
233237
{"Softmax", V_2020_4, {"CPU", "GPU"}},
234238
{"Softplus", V_2022_1, {"CPU", "GPU"}},

onnxruntime/core/providers/qnn/rpcmem_library.cc

+136-23
Original file line numberDiff line numberDiff line change
@@ -2,44 +2,157 @@
22
// Licensed under the MIT License
33

44
#include "core/providers/qnn/rpcmem_library.h"
5+
6+
#if defined(_WIN32)
7+
#include <filesystem>
8+
9+
#include <sysinfoapi.h>
10+
#include <winsvc.h>
11+
#endif // defined(_WIN32)
12+
513
#include "core/providers/qnn/ort_api.h"
614

715
namespace onnxruntime::qnn {
816

17+
// Unload the dynamic library referenced by `library_handle`.
18+
// Avoid throwing because this may run from a dtor.
19+
void DynamicLibraryHandleDeleter::operator()(void* library_handle) noexcept {
20+
if (library_handle == nullptr) {
21+
return;
22+
}
23+
24+
const auto& env = GetDefaultEnv();
25+
const auto unload_status = env.UnloadDynamicLibrary(library_handle);
26+
27+
if (!unload_status.IsOK()) {
28+
LOGS_DEFAULT(WARNING) << "Failed to unload dynamic library. Error: " << unload_status.ErrorMessage();
29+
}
30+
}
31+
932
namespace {
1033

11-
const PathChar* GetRpcMemSharedLibraryPath() {
1234
#if defined(_WIN32)
13-
return ORT_TSTR("libcdsprpc.dll");
14-
#else
15-
return ORT_TSTR("libcdsprpc.so");
16-
#endif
35+
36+
struct ServiceHandleDeleter {
37+
void operator()(SC_HANDLE handle) { ::CloseServiceHandle(handle); }
38+
};
39+
40+
using UniqueServiceHandle = std::unique_ptr<std::remove_pointer_t<SC_HANDLE>, ServiceHandleDeleter>;
41+
42+
Status ReadEnvironmentVariable(const wchar_t* name, std::wstring& value_out) {
43+
const DWORD value_size = ::GetEnvironmentVariableW(name, nullptr, 0);
44+
ORT_RETURN_IF(value_size == 0,
45+
"Failed to get environment variable length. GetEnvironmentVariableW error: ", ::GetLastError());
46+
47+
std::vector<wchar_t> value(value_size);
48+
49+
ORT_RETURN_IF(::GetEnvironmentVariableW(name, value.data(), value_size) == 0,
50+
"Failed to get environment variable value. GetEnvironmentVariableW error: ", ::GetLastError());
51+
52+
value_out = std::wstring{value.data()};
53+
return Status::OK();
1754
}
1855

19-
DynamicLibraryHandle LoadDynamicLibrary(const PathString& path, bool global_symbols) {
20-
// Custom deleter to unload the shared library. Avoid throwing from it because it may run in dtor.
21-
const auto unload_library = [](void* library_handle) {
22-
if (library_handle == nullptr) {
23-
return;
24-
}
56+
Status GetServiceBinaryDirectoryPath(const wchar_t* service_name,
57+
std::filesystem::path& service_binary_directory_path_out) {
58+
SC_HANDLE scm_handle_raw = ::OpenSCManagerW(nullptr, // local computer
59+
nullptr, // SERVICES_ACTIVE_DATABASE
60+
STANDARD_RIGHTS_READ);
61+
ORT_RETURN_IF(scm_handle_raw == nullptr,
62+
"Failed to open handle to service control manager. OpenSCManagerW error: ", ::GetLastError());
63+
64+
auto scm_handle = UniqueServiceHandle{scm_handle_raw};
65+
66+
SC_HANDLE service_handle_raw = ::OpenServiceW(scm_handle.get(),
67+
service_name,
68+
SERVICE_QUERY_CONFIG);
69+
ORT_RETURN_IF(service_handle_raw == nullptr,
70+
"Failed to open service handle. OpenServiceW error: ", ::GetLastError());
71+
72+
auto service_handle = UniqueServiceHandle{service_handle_raw};
73+
74+
// get service config required buffer size
75+
DWORD service_config_buffer_size{};
76+
ORT_RETURN_IF(!::QueryServiceConfigW(service_handle.get(), nullptr, 0, &service_config_buffer_size) &&
77+
::GetLastError() != ERROR_INSUFFICIENT_BUFFER,
78+
"Failed to query service configuration buffer size. QueryServiceConfigW error: ", ::GetLastError());
2579

26-
const auto& env = GetDefaultEnv();
27-
const auto unload_status = env.UnloadDynamicLibrary(library_handle);
80+
// get the service config
81+
std::vector<std::byte> service_config_buffer(service_config_buffer_size);
82+
QUERY_SERVICE_CONFIGW* service_config = reinterpret_cast<QUERY_SERVICE_CONFIGW*>(service_config_buffer.data());
83+
ORT_RETURN_IF(!::QueryServiceConfigW(service_handle.get(), service_config, service_config_buffer_size,
84+
&service_config_buffer_size),
85+
"Failed to query service configuration. QueryServiceConfigW error: ", ::GetLastError());
2886

29-
if (!unload_status.IsOK()) {
30-
LOGS_DEFAULT(WARNING) << "Failed to unload shared library. Error: " << unload_status.ErrorMessage();
31-
}
32-
};
87+
std::wstring service_binary_path_name = service_config->lpBinaryPathName;
3388

89+
// replace system root placeholder with the value of the SYSTEMROOT environment variable
90+
const std::wstring system_root_placeholder = L"\\SystemRoot";
91+
92+
ORT_RETURN_IF(service_binary_path_name.find(system_root_placeholder, 0) != 0,
93+
"Service binary path '", ToUTF8String(service_binary_path_name),
94+
"' does not start with expected system root placeholder value '",
95+
ToUTF8String(system_root_placeholder), "'.");
96+
97+
std::wstring system_root{};
98+
ORT_RETURN_IF_ERROR(ReadEnvironmentVariable(L"SYSTEMROOT", system_root));
99+
service_binary_path_name.replace(0, system_root_placeholder.size(), system_root);
100+
101+
const auto service_binary_path = std::filesystem::path{service_binary_path_name};
102+
auto service_binary_directory_path = service_binary_path.parent_path();
103+
104+
ORT_RETURN_IF(!std::filesystem::exists(service_binary_directory_path),
105+
"Service binary directory path does not exist: ", service_binary_directory_path.string());
106+
107+
service_binary_directory_path_out = std::move(service_binary_directory_path);
108+
return Status::OK();
109+
}
110+
111+
#endif // defined(_WIN32)
112+
113+
Status GetRpcMemDynamicLibraryPath(PathString& path_out) {
114+
#if defined(_WIN32)
115+
116+
std::filesystem::path qcnspmcdm_dir_path{};
117+
ORT_RETURN_IF_ERROR(GetServiceBinaryDirectoryPath(L"qcnspmcdm", qcnspmcdm_dir_path));
118+
const auto libcdsprpc_path = qcnspmcdm_dir_path / L"libcdsprpc.dll";
119+
path_out = libcdsprpc_path.wstring();
120+
return Status::OK();
121+
122+
#else // ^^^ defined(_WIN32) / vvv !defined(_WIN32)
123+
124+
path_out = ORT_TSTR("libcdsprpc.so");
125+
return Status::OK();
126+
127+
#endif // !defined(_WIN32)
128+
}
129+
130+
Status LoadDynamicLibrary(const PathString& path, bool global_symbols,
131+
UniqueDynamicLibraryHandle& library_handle_out) {
34132
const auto& env = GetDefaultEnv();
35-
void* library_handle = nullptr;
133+
void* library_handle_raw = nullptr;
134+
ORT_RETURN_IF_ERROR(env.LoadDynamicLibrary(path, global_symbols, &library_handle_raw));
135+
136+
library_handle_out = UniqueDynamicLibraryHandle{library_handle_raw};
137+
return Status::OK();
138+
}
139+
140+
UniqueDynamicLibraryHandle GetRpcMemDynamicLibraryHandle() {
141+
std::string_view error_message_prefix = "Failed to initialize RPCMEM dynamic library handle: ";
142+
143+
PathString rpcmem_library_path{};
144+
auto status = GetRpcMemDynamicLibraryPath(rpcmem_library_path);
145+
if (!status.IsOK()) {
146+
ORT_THROW(error_message_prefix, status.ErrorMessage());
147+
}
36148

37-
const auto load_status = env.LoadDynamicLibrary(path, global_symbols, &library_handle);
38-
if (!load_status.IsOK()) {
39-
ORT_THROW("Failed to load ", ToUTF8String(path), ": ", load_status.ErrorMessage());
149+
UniqueDynamicLibraryHandle library_handle{};
150+
status = LoadDynamicLibrary(rpcmem_library_path, /* global_symbols */ false, library_handle);
151+
if (!status.IsOK()) {
152+
ORT_THROW(error_message_prefix, status.ErrorMessage());
40153
}
41154

42-
return DynamicLibraryHandle{library_handle, unload_library};
155+
return library_handle;
43156
}
44157

45158
RpcMemApi CreateApi(void* library_handle) {
@@ -58,7 +171,7 @@ RpcMemApi CreateApi(void* library_handle) {
58171
} // namespace
59172

60173
RpcMemLibrary::RpcMemLibrary()
61-
: library_handle_(LoadDynamicLibrary(GetRpcMemSharedLibraryPath(), /* global_symbols */ false)),
174+
: library_handle_(GetRpcMemDynamicLibraryHandle()),
62175
api_{CreateApi(library_handle_.get())} {
63176
}
64177

onnxruntime/core/providers/qnn/rpcmem_library.h

+6-2
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,11 @@
1010

1111
namespace onnxruntime::qnn {
1212

13-
using DynamicLibraryHandle = std::unique_ptr<void, void (*)(void*)>;
13+
struct DynamicLibraryHandleDeleter {
14+
void operator()(void* library_handle) noexcept;
15+
};
16+
17+
using UniqueDynamicLibraryHandle = std::unique_ptr<void, DynamicLibraryHandleDeleter>;
1418

1519
// This namespace contains constants and typedefs corresponding to functions from rpcmem.h.
1620
// https://github.com/quic/fastrpc/blob/v0.1.1/inc/rpcmem.h
@@ -61,7 +65,7 @@ class RpcMemLibrary {
6165
const RpcMemApi& Api() const { return api_; }
6266

6367
private:
64-
DynamicLibraryHandle library_handle_;
68+
UniqueDynamicLibraryHandle library_handle_;
6569
RpcMemApi api_;
6670
};
6771

onnxruntime/test/contrib_ops/dynamic_quantize_matmul_test.cc

+1-1
Original file line numberDiff line numberDiff line change
@@ -141,7 +141,7 @@ void TestDynamicQuantizeMatMul(bool is_matrix_b_constant,
141141
per_column, has_zp, has_bias);
142142
test.AddOutput<float>("Y", Y_dims, Y_data);
143143
test.SetOutputRelErr("Y", 0.02f);
144-
test.Run();
144+
test.Run(OpTester::ExpectResult::kExpectSuccess, "", {kOpenVINOExecutionProvider});
145145
}
146146

147147
template <typename T, bool HasZeroPoint, bool HasBias>

onnxruntime/test/contrib_ops/embed_layer_norm_op_test.cc

-4
Original file line numberDiff line numberDiff line change
@@ -158,11 +158,7 @@ static void RunTest(const embedlayernorm::OpData& data,
158158
execution_providers.push_back(DefaultDmlExecutionProvider());
159159
tester.Run(OpTester::ExpectResult::kExpectSuccess, "", {}, nullptr, &execution_providers);
160160
} else {
161-
#if defined(USE_OPENVINO)
162161
tester.Run(OpTester::ExpectResult::kExpectSuccess, "", {kOpenVINOExecutionProvider});
163-
#else
164-
tester.Run();
165-
#endif
166162
}
167163
}
168164
}

onnxruntime/test/contrib_ops/fused_matmul_op_test.cc

+2-2
Original file line numberDiff line numberDiff line change
@@ -212,8 +212,8 @@ void RunFusedMatMulTest(const char* op_name, int32_t opset_version = 7, bool tra
212212

213213
test.AddOutput<T>("Y", t.expected_dims, t.expected_vals);
214214

215-
// Disable TensorRT because of unsupported data type
216-
test.Run(OpTester::ExpectResult::kExpectSuccess, "", {kTensorrtExecutionProvider});
215+
// Disable OpenVINO, TensorRT because of unsupported data type
216+
test.Run(OpTester::ExpectResult::kExpectSuccess, "", {kTensorrtExecutionProvider, kOpenVINOExecutionProvider});
217217
}
218218
}
219219

onnxruntime/test/providers/qnn/qnn_basic_test.cc

+2-12
Original file line numberDiff line numberDiff line change
@@ -1166,18 +1166,8 @@ TEST_F(QnnHTPBackendTests, UseHtpSharedMemoryAllocatorForInputs) {
11661166
try {
11671167
qnn_ep = QnnExecutionProviderWithOptions(provider_options);
11681168
} catch (const OnnxRuntimeException& e) {
1169-
// handle particular exception that indicates that the libcdsprpc.so / dll can't be loaded
1170-
// NOTE: To run this on a local Windows ARM64 device, you need to copy libcdsprpc.dll to the build directory:
1171-
// - Open File Explorer
1172-
// - Go to C:/Windows/System32/DriverStore/FileRepository/
1173-
// - Search for a folder that begins with qcnspmcdm8380.inf_arm64_ and open it
1174-
// - Copy the libcdsprpc.dll into the build/[PATH CONTAINING onnxruntime.dll] directory of the application.
1175-
// TODO(adrianlizarraga): Update CMake build for unittests to automatically copy libcdsprpc.dll into build directory
1176-
#if defined(_WIN32)
1177-
constexpr const char* expected_error_message = "Failed to load libcdsprpc.dll";
1178-
#else
1179-
constexpr const char* expected_error_message = "Failed to load libcdsprpc.so";
1180-
#endif
1169+
// handle exception that indicates that the libcdsprpc.so / dll can't be loaded
1170+
constexpr const char* expected_error_message = "Failed to initialize RPCMEM dynamic library handle";
11811171
ASSERT_THAT(e.what(), testing::HasSubstr(expected_error_message));
11821172
GTEST_SKIP() << "HTP shared memory allocator is unavailable.";
11831173
}

onnxruntime/test/shared_lib/test_inference.cc

+2-13
Original file line numberDiff line numberDiff line change
@@ -1960,20 +1960,9 @@ static bool CreateSessionWithQnnEpAndQnnHtpSharedMemoryAllocator(PATH_TYPE model
19601960
session = Ort::Session{*ort_env, model_path, session_options};
19611961
return true;
19621962
} catch (const Ort::Exception& e) {
1963-
// handle particular exception that indicates that the libcdsprpc.so / dll can't be loaded
1964-
// NOTE: To run this on a local Windows ARM64 device, you need to copy libcdsprpc.dll to the build directory:
1965-
// - Open File Explorer
1966-
// - Go to C:/Windows/System32/DriverStore/FileRepository/
1967-
// - Search for a folder that begins with qcnspmcdm8380.inf_arm64_ and open it
1968-
// - Copy the libcdsprpc.dll into the build/[PATH CONTAINING onnxruntime.dll] directory of the application.
1969-
// TODO(adrianlizarraga): Update CMake build for unittests to automatically copy libcdsprpc.dll into build directory
1963+
// handle exception that indicates that the libcdsprpc.so / dll can't be loaded
19701964
std::string_view error_message = e.what();
1971-
1972-
#if defined(_WIN32)
1973-
std::string_view expected_error_message = "Failed to load libcdsprpc.dll";
1974-
#else
1975-
std::string_view expected_error_message = "Failed to load libcdsprpc.so";
1976-
#endif
1965+
std::string_view expected_error_message = "Failed to initialize RPCMEM dynamic library handle";
19771966

19781967
if (e.GetOrtErrorCode() == ORT_FAIL &&
19791968
error_message.find(expected_error_message) != std::string_view::npos) {

tools/ci_build/github/azure-pipelines/linux-gpu-tensorrt-daily-perf-pipeline.yml

+1-1
Original file line numberDiff line numberDiff line change
@@ -83,7 +83,7 @@ jobs:
8383

8484
- name: parser
8585
${{ if eq(parameters.UseTensorrtOssParser, true) }}:
86-
value: --use_tensorrt_oss_parser $(parameters.UseTensorrtOssParser) }}
86+
value: --use_tensorrt_oss_parser $(parameters.UseTensorrtOssParser)
8787

8888
steps:
8989
- ${{ if and(eq(parameters.TrtVersion, 'BIN'), eq(parameters.UseTensorrtOssParser, false)) }}:

0 commit comments

Comments
 (0)