Skip to content

Commit

Permalink
Align with changes in dpctl::tensor::offset_utils::device_allocate_and_pack
Browse files Browse the repository at this point in the history
  • Loading branch information
antonwolfy committed Jan 10, 2025
1 parent 23c4907 commit 49f957b
Showing 1 changed file with 12 additions and 21 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -218,15 +218,12 @@ std::pair<sycl::event, sycl::event>
std::vector<sycl::event> host_tasks{};
host_tasks.reserve(2);

const auto &ptr_size_event_triple_ = device_allocate_and_pack<py::ssize_t>(
auto ptr_size_event_triple_ = device_allocate_and_pack<py::ssize_t>(
q, host_tasks, simplified_shape, simplified_src_strides,
simplified_dst_strides);
py::ssize_t *shape_strides = std::get<0>(ptr_size_event_triple_);
const sycl::event &copy_shape_ev = std::get<2>(ptr_size_event_triple_);

if (shape_strides == nullptr) {
throw std::runtime_error("Device memory allocation failed");
}
auto shape_strides_owner = std::move(std::get<0>(ptr_size_event_triple_));
const auto &copy_shape_ev = std::get<2>(ptr_size_event_triple_);
const py::ssize_t *shape_strides = shape_strides_owner.get();

sycl::event strided_fn_ev =
strided_fn(q, src_nelems, nd, shape_strides, src_data, src_offset,
Expand Down Expand Up @@ -543,16 +540,13 @@ std::pair<sycl::event, sycl::event> py_binary_ufunc(
}

using dpctl::tensor::offset_utils::device_allocate_and_pack;
const auto &ptr_sz_event_triple_ = device_allocate_and_pack<py::ssize_t>(
auto ptr_sz_event_triple_ = device_allocate_and_pack<py::ssize_t>(
exec_q, host_tasks, simplified_shape, simplified_src1_strides,
simplified_src2_strides, simplified_dst_strides);
auto shape_strides_owner = std::move(std::get<0>(ptr_sz_event_triple_));
auto &copy_shape_ev = std::get<2>(ptr_sz_event_triple_);

py::ssize_t *shape_strides = std::get<0>(ptr_sz_event_triple_);
const sycl::event &copy_shape_ev = std::get<2>(ptr_sz_event_triple_);

if (shape_strides == nullptr) {
throw std::runtime_error("Unable to allocate device memory");
}
const py::ssize_t *shape_strides = shape_strides_owner.get();

sycl::event strided_fn_ev = strided_fn(
exec_q, src_nelems, nd, shape_strides, src1_data, src1_offset,
Expand Down Expand Up @@ -796,16 +790,13 @@ std::pair<sycl::event, sycl::event>
}

using dpctl::tensor::offset_utils::device_allocate_and_pack;
const auto &ptr_sz_event_triple_ = device_allocate_and_pack<py::ssize_t>(
auto ptr_sz_event_triple_ = device_allocate_and_pack<py::ssize_t>(
exec_q, host_tasks, simplified_shape, simplified_rhs_strides,
simplified_lhs_strides);
auto shape_strides_owner = std::move(std::get<0>(ptr_sz_event_triple_));
auto copy_shape_ev = std::get<2>(ptr_sz_event_triple_);

py::ssize_t *shape_strides = std::get<0>(ptr_sz_event_triple_);
const sycl::event &copy_shape_ev = std::get<2>(ptr_sz_event_triple_);

if (shape_strides == nullptr) {
throw std::runtime_error("Unable to allocate device memory");
}
const py::ssize_t *shape_strides = shape_strides_owner.get();

sycl::event strided_fn_ev =
strided_fn(exec_q, rhs_nelems, nd, shape_strides, rhs_data, rhs_offset,
Expand Down

0 comments on commit 49f957b

Please sign in to comment.