Skip to content

Commit a8acdf0

Browse files
Merge pull request #1645 from IntelPython/change-signatures-to-use-queue-ref
Avoid sycl::queue copying in libtensor
2 parents 182aede + ffe13ea commit a8acdf0

File tree

3 files changed

+14
-14
lines changed

3 files changed

+14
-14
lines changed

dpctl/tensor/libtensor/include/kernels/reductions.hpp

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -2383,7 +2383,7 @@ struct CustomSearchReduction
23832383
};
23842384

23852385
typedef sycl::event (*search_strided_impl_fn_ptr)(
2386-
sycl::queue,
2386+
sycl::queue &,
23872387
size_t,
23882388
size_t,
23892389
const char *,
@@ -2507,7 +2507,7 @@ template <typename argTy,
25072507
typename ReductionOpT,
25082508
typename IndexOpT>
25092509
sycl::event search_over_group_temps_strided_impl(
2510-
sycl::queue exec_q,
2510+
sycl::queue &exec_q,
25112511
size_t iter_nelems, // number of reductions (num. of rows in a matrix
25122512
// when reducing over rows)
25132513
size_t reduction_nelems, // size of each reduction (length of rows, i.e.
@@ -2804,7 +2804,7 @@ sycl::event search_over_group_temps_strided_impl(
28042804
}
28052805

28062806
typedef sycl::event (*search_contig_impl_fn_ptr)(
2807-
sycl::queue,
2807+
sycl::queue &,
28082808
size_t,
28092809
size_t,
28102810
const char *,
@@ -2819,7 +2819,7 @@ template <typename argTy,
28192819
typename ReductionOpT,
28202820
typename IndexOpT>
28212821
sycl::event search_axis1_over_group_temps_contig_impl(
2822-
sycl::queue exec_q,
2822+
sycl::queue &exec_q,
28232823
size_t iter_nelems, // number of reductions (num. of rows in a matrix
28242824
// when reducing over rows)
28252825
size_t reduction_nelems, // size of each reduction (length of rows, i.e.
@@ -3098,7 +3098,7 @@ template <typename argTy,
30983098
typename ReductionOpT,
30993099
typename IndexOpT>
31003100
sycl::event search_axis0_over_group_temps_contig_impl(
3101-
sycl::queue exec_q,
3101+
sycl::queue &exec_q,
31023102
size_t iter_nelems, // number of reductions (num. of rows in a matrix
31033103
// when reducing over rows)
31043104
size_t reduction_nelems, // size of each reduction (length of rows, i.e.

dpctl/tensor/libtensor/source/device_support_queries.cpp

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -82,7 +82,7 @@ sycl::device _extract_device(const py::object &arg)
8282

8383
PyObject *source = arg.ptr();
8484
if (api.PySyclQueue_Check_(source)) {
85-
sycl::queue q = py::cast<sycl::queue>(arg);
85+
const sycl::queue &q = py::cast<sycl::queue>(arg);
8686
return q.get_device();
8787
}
8888
else if (api.PySyclDevice_Check_(source)) {
@@ -98,31 +98,31 @@ sycl::device _extract_device(const py::object &arg)
9898

9999
std::string default_device_fp_type(const py::object &arg)
100100
{
101-
sycl::device d = _extract_device(arg);
101+
const sycl::device &d = _extract_device(arg);
102102
return _default_device_fp_type(d);
103103
}
104104

105105
std::string default_device_int_type(const py::object &arg)
106106
{
107-
sycl::device d = _extract_device(arg);
107+
const sycl::device &d = _extract_device(arg);
108108
return _default_device_int_type(d);
109109
}
110110

111111
std::string default_device_bool_type(const py::object &arg)
112112
{
113-
sycl::device d = _extract_device(arg);
113+
const sycl::device &d = _extract_device(arg);
114114
return _default_device_bool_type(d);
115115
}
116116

117117
std::string default_device_complex_type(const py::object &arg)
118118
{
119-
sycl::device d = _extract_device(arg);
119+
const sycl::device &d = _extract_device(arg);
120120
return _default_device_complex_type(d);
121121
}
122122

123123
std::string default_device_index_type(const py::object &arg)
124124
{
125-
sycl::device d = _extract_device(arg);
125+
const sycl::device &d = _extract_device(arg);
126126
return _default_device_index_type(d);
127127
}
128128

dpctl/tensor/libtensor/source/elementwise_functions/elementwise_functions.hpp

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -63,7 +63,7 @@ template <typename output_typesT,
6363
std::pair<sycl::event, sycl::event>
6464
py_unary_ufunc(const dpctl::tensor::usm_ndarray &src,
6565
const dpctl::tensor::usm_ndarray &dst,
66-
sycl::queue q,
66+
sycl::queue &q,
6767
const std::vector<sycl::event> &depends,
6868
//
6969
const output_typesT &output_type_vec,
@@ -301,7 +301,7 @@ std::pair<sycl::event, sycl::event> py_binary_ufunc(
301301
const dpctl::tensor::usm_ndarray &src1,
302302
const dpctl::tensor::usm_ndarray &src2,
303303
const dpctl::tensor::usm_ndarray &dst, // dst = op(src1, src2), elementwise
304-
sycl::queue exec_q,
304+
sycl::queue &exec_q,
305305
const std::vector<sycl::event> depends,
306306
//
307307
const output_typesT &output_type_table,
@@ -622,7 +622,7 @@ template <typename output_typesT,
622622
std::pair<sycl::event, sycl::event>
623623
py_binary_inplace_ufunc(const dpctl::tensor::usm_ndarray &lhs,
624624
const dpctl::tensor::usm_ndarray &rhs,
625-
sycl::queue exec_q,
625+
sycl::queue &exec_q,
626626
const std::vector<sycl::event> depends,
627627
//
628628
const output_typesT &output_type_table,

0 commit comments

Comments
 (0)