IntelPython
diff --git a/‎dpctl/tensor/CMakeLists.txt
Lines changed: 1 addition & 0 deletions b/‎dpctl/tensor/CMakeLists.txt
Lines changed: 1 addition & 0 deletions
diff --git a/‎dpctl/tensor/__init__.py
Lines changed: 3 additions & 0 deletions b/‎dpctl/tensor/__init__.py
Lines changed: 3 additions & 0 deletions
diff --git a/‎dpctl/tensor/_copy_utils.py
Lines changed: 42 additions & 15 deletions b/‎dpctl/tensor/_copy_utils.py
Lines changed: 42 additions & 15 deletions
diff --git a/‎dpctl/tensor/_indexing_functions.py
Lines changed: 171 additions & 0 deletions b/‎dpctl/tensor/_indexing_functions.py
Lines changed: 171 additions & 0 deletions
@@ -23,6 +23,7 @@ pybind11_add_module(${python_module_name} MODULE
     ${CMAKE_CURRENT_SOURCE_DIR}/libtensor/source/copy_numpy_ndarray_into_usm_ndarray.cpp
     ${CMAKE_CURRENT_SOURCE_DIR}/libtensor/source/copy_for_reshape.cpp
     ${CMAKE_CURRENT_SOURCE_DIR}/libtensor/source/linear_sequences.cpp
+    ${CMAKE_CURRENT_SOURCE_DIR}/libtensor/source/advanced_indexing.cpp
     ${CMAKE_CURRENT_SOURCE_DIR}/libtensor/source/eye_ctor.cpp
     ${CMAKE_CURRENT_SOURCE_DIR}/libtensor/source/full_ctor.cpp
     ${CMAKE_CURRENT_SOURCE_DIR}/libtensor/source/triul_ctor.cpp
 
@@ -58,6 +58,7 @@
 )
 from dpctl.tensor._device import Device
 from dpctl.tensor._dlpack import from_dlpack
+from dpctl.tensor._indexing_functions import put, take
 from dpctl.tensor._manipulation_functions import (
     broadcast_arrays,
     broadcast_to,
@@ -112,6 +113,8 @@
     "expand_dims",
     "permute_dims",
     "squeeze",
+    "take",
+    "put",
     "from_numpy",
     "to_numpy",
     "asnumpy",
 
@@ -13,7 +13,10 @@
 #  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 #  See the License for the specific language governing permissions and
 #  limitations under the License.
+import operator
+
 import numpy as np
+from numpy.core.numeric import normalize_axis_index
 
 import dpctl
 import dpctl.memory as dpm
@@ -449,14 +452,25 @@ def _mock_take_multi_index(ary, inds, p):
         raise IndexError(
             "arrays used as indices must be of integer (or boolean) type"
         )
-    ary_np = dpt.asnumpy(ary)
-    ind_np = (slice(None),) * p + tuple(dpt.asnumpy(ind) for ind in inds)
-    res_np = ary_np[ind_np]
+    inds = dpt.broadcast_arrays(*inds)
+    ary_ndim = ary.ndim
+    if ary_ndim > 0:
+        p = operator.index(p)
+        p = normalize_axis_index(p, ary_ndim)
+
+        res_shape = ary.shape[:p] + inds[0].shape + ary.shape[p + len(inds) :]
+    else:
+        res_shape = inds[0].shape
     res_usm_type = dpctl.utils.get_coerced_usm_type(usm_types_)
     res = dpt.empty(
-        res_np.shape, dtype=ary.dtype, usm_type=res_usm_type, sycl_queue=exec_q
+        res_shape, dtype=ary.dtype, usm_type=res_usm_type, sycl_queue=exec_q
     )
-    res[...] = res_np
+
+    hev, _ = ti._take(
+        src=ary, ind=inds, dst=res, axis_start=p, mode=0, sycl_queue=exec_q
+    )
+    hev.wait()
+
     return res
 
 
@@ -492,7 +506,7 @@ def _mock_place(ary, ary_mask, p, vals):
 
 
 def _mock_put_multi_index(ary, inds, p, vals):
-    if isinstance(vals, dpt.ums_ndarray):
+    if isinstance(vals, dpt.usm_ndarray):
         queues_ = [ary.sycl_queue, vals.sycl_queue]
         usm_types_ = [ary.usm_type, vals.usm_type]
     else:
@@ -522,14 +536,27 @@ def _mock_put_multi_index(ary, inds, p, vals):
         raise IndexError(
             "arrays used as indices must be of integer (or boolean) type"
         )
-    ary_np = dpt.asnumpy(ary)
-    if isinstance(vals, dpt.usm_ndarray) or hasattr(
-        vals, "__sycl_usm_array_interface__"
-    ):
-        vals_np = dpt.asnumpy(vals)
+
+    inds = dpt.broadcast_arrays(*inds)
+    ary_ndim = ary.ndim
+    if ary_ndim > 0:
+        p = operator.index(p)
+        p = normalize_axis_index(p, ary_ndim)
+        vals_shape = ary.shape[:p] + inds[0].shape + ary.shape[p + len(inds) :]
     else:
-        vals_np = vals
-    ind_np = (slice(None),) * p + tuple(dpt.asnumpy(ind) for ind in inds)
-    ary_np[ind_np] = vals_np
-    ary[...] = ary_np
+        vals_shape = inds[0].shape
+
+    vals_usm_type = dpctl.utils.get_coerced_usm_type(usm_types_)
+    if not isinstance(vals, dpt.usm_ndarray):
+        vals = dpt.asarray(
+            vals, ary.dtype, usm_type=vals_usm_type, sycl_queue=exec_q
+        )
+
+    vals = dpt.broadcast_to(vals, vals_shape)
+
+    hev, _ = ti._put(
+        dst=ary, ind=inds, val=vals, axis_start=p, mode=0, sycl_queue=exec_q
+    )
+    hev.wait()
+
     return
@@ -0,0 +1,171 @@
+#                       Data Parallel Control (dpctl)
+#
+#  Copyright 2020-2022 Intel Corporation
+#
+#  Licensed under the Apache License, Version 2.0 (the "License");
+#  you may not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing, software
+#  distributed under the License is distributed on an "AS IS" BASIS,
+#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+#  See the License for the specific language governing permissions and
+#  limitations under the License.
+
+import operator
+
+import numpy as np
+from numpy.core.numeric import normalize_axis_index
+
+import dpctl
+import dpctl.tensor as dpt
+from dpctl.tensor._tensor_impl import _put, _take
+
+
+def take(x, indices, /, *, axis=None, mode="clip"):
+    """Gather elements of `x` at integer `indices` along `axis`.
+
+    Args:
+        x: source `dpt.usm_ndarray`.
+        indices: an integer `dpt.usm_ndarray` or a list/tuple of them;
+            after mutual broadcasting they replace `len(indices)` axes of
+            `x` starting at `axis`.
+        axis: first indexed axis; `None` is allowed only if `x.ndim <= 1`.
+        mode: `"clip"` or `"wrap"`, passed to `_take` as 0 or 1.
+
+    Returns:
+        New `dpt.usm_ndarray` of dtype `x.dtype` allocated on the common
+        execution queue, with shape
+        `x.shape[:axis] + index_shape + x.shape[axis + len(indices):]`.
+
+    Raises:
+        TypeError: `x` or an index is not a `dpt.usm_ndarray`, or an index
+            has a non-integer dtype.
+        ValueError: bad `mode`, or `axis` is `None` while `x.ndim > 1`.
+        dpctl.utils.ExecutionPlacementError: no common execution queue.
+    """
+    if not isinstance(x, dpt.usm_ndarray):
+        raise TypeError(
+            "Expected instance of `dpt.usm_ndarray`, got `{}`.".format(type(x))
+        )
+    # A lone index array is handled as a one-element tuple.
+    if not isinstance(indices, (list, tuple)):
+        indices = (indices,)
+
+    alloc_queues = [x.sycl_queue]
+    alloc_usm_types = [x.usm_type]
+    for ind in indices:
+        if not isinstance(ind, dpt.usm_ndarray):
+            raise TypeError(
+                "`indices` expected `dpt.usm_ndarray`, got `{}`.".format(
+                    type(ind)
+                )
+            )
+        if not np.issubdtype(ind.dtype, np.integer):
+            raise TypeError(
+                "`indices` expected integer data type, got `{}`".format(
+                    ind.dtype
+                )
+            )
+        alloc_queues.append(ind.sycl_queue)
+        alloc_usm_types.append(ind.usm_type)
+
+    exec_q = dpctl.utils.get_execution_queue(alloc_queues)
+    if exec_q is None:
+        raise dpctl.utils.ExecutionPlacementError(
+            "Can not automatically determine where to allocate the "
+            "result or performance execution. "
+            "Use `usm_ndarray.to_device` method to migrate data to "
+            "be associated with the same queue."
+        )
+    res_usm_type = dpctl.utils.get_coerced_usm_type(alloc_usm_types)
+
+    # Translate the mode name into the integer code `_take` receives.
+    try:
+        mode_id = {"clip": 0, "wrap": 1}[mode]
+    except KeyError:
+        raise ValueError("`mode` must be `clip` or `wrap`.")
+
+    ndim = x.ndim
+    if axis is None and ndim > 1:
+        raise ValueError(
+            "`axis` cannot be `None` for array of dimension `{}`".format(ndim)
+        )
+    if axis is None:
+        axis = 0
+
+    indices = dpt.broadcast_arrays(*indices)
+    if ndim > 0:
+        axis = normalize_axis_index(operator.index(axis), ndim)
+        lead, trail = x.shape[:axis], x.shape[axis + len(indices) :]
+        res_shape = lead + indices[0].shape + trail
+    else:
+        # 0-d source: the result takes the shape of the index arrays.
+        res_shape = indices[0].shape
+    res = dpt.empty(
+        res_shape, dtype=x.dtype, usm_type=res_usm_type, sycl_queue=exec_q
+    )
+
+    # Wait on the event returned by `_take` before handing `res` back.
+    host_ev, _ = _take(x, indices, res, axis, mode_id, sycl_queue=exec_q)
+    host_ev.wait()
+    return res
+
+
+def put(x, indices, vals, /, *, axis=None, mode="clip"):
+    """Scatter `vals` into `x` in place at integer `indices` along `axis`.
+
+    Args:
+        x: destination `dpt.usm_ndarray`, modified in place.
+        indices: an integer `dpt.usm_ndarray` or a list/tuple of them;
+            after mutual broadcasting they replace `len(indices)` axes of
+            `x` starting at `axis`.
+        vals: values to write. A `dpt.usm_ndarray` is used as given and its
+            queue takes part in execution-queue resolution; anything else
+            is converted with `dpt.asarray` to `x.dtype`. Either way it is
+            broadcast to the selection shape.
+        axis: first indexed axis. `None` reshapes `x` to 1D with
+            `copy=False` and uses axis 0.
+        mode: `"clip"` or `"wrap"`, passed to `_put` as 0 or 1.
+
+    Raises:
+        TypeError: `x` or an index is not a `dpt.usm_ndarray`, or an index
+            has a non-integer dtype.
+        ValueError: `mode` is not a supported name.
+        dpctl.utils.ExecutionPlacementError: `x`, the indices and an
+            array-valued `vals` have no common execution queue.
+    """
+    if not isinstance(x, dpt.usm_ndarray):
+        raise TypeError(
+            "Expected instance of `dpt.usm_ndarray`, got `{}`.".format(type(x))
+        )
+    queues_ = [x.sycl_queue]
+    usm_types_ = [x.usm_type]
+    # An array-valued `vals` is an operand of the kernel too, so its queue
+    # and USM type must enter the compatibility check; otherwise a `vals`
+    # living on another queue would slip past ExecutionPlacementError.
+    if isinstance(vals, dpt.usm_ndarray):
+        queues_.append(vals.sycl_queue)
+        usm_types_.append(vals.usm_type)
+
+    # A lone index array is handled as a one-element tuple.
+    if not isinstance(indices, (list, tuple)):
+        indices = (indices,)
+
+    for i in indices:
+        if not isinstance(i, dpt.usm_ndarray):
+            raise TypeError(
+                "`indices` expected `dpt.usm_ndarray`, got `{}`.".format(
+                    type(i)
+                )
+            )
+        if not np.issubdtype(i.dtype, np.integer):
+            raise TypeError(
+                "`indices` expected integer data type, got `{}`".format(i.dtype)
+            )
+        queues_.append(i.sycl_queue)
+        usm_types_.append(i.usm_type)
+    exec_q = dpctl.utils.get_execution_queue(queues_)
+    if exec_q is None:
+        raise dpctl.utils.ExecutionPlacementError(
+            "Can not automatically determine where to allocate the "
+            "result or performance execution. "
+            "Use `usm_ndarray.to_device` method to migrate data to "
+            "be associated with the same queue."
+        )
+    val_usm_type = dpctl.utils.get_coerced_usm_type(usm_types_)
+
+    # Translate the mode name into the integer code `_put` receives.
+    modes = {"clip": 0, "wrap": 1}
+    try:
+        mode = modes[mode]
+    except KeyError:
+        # `from None`: the internal KeyError is noise for the caller.
+        raise ValueError("`mode` must be `wrap`, or `clip`.") from None
+
+    # when axis is None, array is treated as 1D; copy=False because the
+    # write below has to land in the caller's data, not in a copy
+    if axis is None:
+        x = dpt.reshape(x, (x.size,), copy=False)
+        axis = 0
+
+    indices = dpt.broadcast_arrays(*indices)
+    x_ndim = x.ndim
+    if x_ndim > 0:
+        axis = operator.index(axis)
+        axis = normalize_axis_index(axis, x_ndim)
+
+        val_shape = (
+            x.shape[:axis] + indices[0].shape + x.shape[axis + len(indices) :]
+        )
+    else:
+        # 0-d destination: values take the shape of the index arrays.
+        val_shape = indices[0].shape
+
+    if not isinstance(vals, dpt.usm_ndarray):
+        vals = dpt.asarray(
+            vals, dtype=x.dtype, usm_type=val_usm_type, sycl_queue=exec_q
+        )
+
+    vals = dpt.broadcast_to(vals, val_shape)
+
+    # Wait on the event returned by `_put` so the write is done on return.
+    hev, _ = _put(x, indices, vals, axis, mode, sycl_queue=exec_q)
+    hev.wait()