We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 71d3c23 commit 129f7b9 Copy full SHA for 129f7b9
dpnp/backend/extensions/lapack/orgqr.cpp
@@ -87,8 +87,17 @@ static sycl::event orgqr_impl(sycl::queue &exec_q,
87
88
sycl::event orgqr_event;
89
try {
90
+ // Release GIL to avoid serialization of host task submissions
91
+ // to the same queue in OneMKL
92
+ py::gil_scoped_release lock{};
93
+
94
scratchpad = sycl::malloc_device<T>(scratchpad_size, exec_q);
95
96
+ // mkl_lapack::orgqr() is done through GPU-to-Host reverse offload:
97
+ // exec_q.submit([&](sycl::handler& cgh) {
98
+ // cgh.depends_on(depends);
99
+ // cgh.host_task([=]() { orgqr_host(...); });
100
+ // }).wait();
101
orgqr_event = mkl_lapack::orgqr(
102
exec_q,
103
m, // The number of rows in the matrix; (0 ≤ m).
0 commit comments