IntelPython
diff --git a/‎README.md
Lines changed: 2 additions & 2 deletions b/‎README.md
Lines changed: 2 additions & 2 deletions
diff --git a/‎doc/conf.py
Lines changed: 1 addition & 1 deletion b/‎doc/conf.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎dpnp/backend/CMakeLists.txt
Lines changed: 4 additions & 1 deletion b/‎dpnp/backend/CMakeLists.txt
Lines changed: 4 additions & 1 deletion
diff --git a/‎dpnp/backend/doc/Doxyfile
Lines changed: 1 addition & 1 deletion b/‎dpnp/backend/doc/Doxyfile
Lines changed: 1 addition & 1 deletion
diff --git a/‎dpnp/backend/examples/example3.cpp
Lines changed: 1 addition & 1 deletion b/‎dpnp/backend/examples/example3.cpp
Lines changed: 1 addition & 1 deletion
diff --git a/‎dpnp/backend/examples/example_bs.cpp
Lines changed: 192 additions & 0 deletions b/‎dpnp/backend/examples/example_bs.cpp
Lines changed: 192 additions & 0 deletions
diff --git a/‎dpnp/backend/include/dpnp_iface.hpp
Lines changed: 58 additions & 9 deletions b/‎dpnp/backend/include/dpnp_iface.hpp
Lines changed: 58 additions & 9 deletions
@@ -37,7 +37,7 @@ python -m unittest tests/test_mixins.py
 
 ## Run numpy external test
 ```bash
-. ./0.env
+. ./0.env.sh
 python -m tests.third_party.numpy_ext
 # or
 python -m tests.third_party.numpy_ext core/tests/test_umath.py
@@ -57,7 +57,7 @@ Building:
 
 ## Packaging:
 ```bash
-. ./0.env
+. ./0.env.sh
 conda-build conda-recipe/
 ```
 
 
@@ -33,7 +33,7 @@
 # The short X.Y version
 version = '0.5'
 # The full version, including alpha/beta/rc tags
-release = '0.5.0'
+release = '0.5.1'
 
 
 # -- General configuration ---------------------------------------------------
 
@@ -27,7 +27,7 @@
 
 cmake_minimum_required(VERSION 3.10 FATAL_ERROR)
 
-# set(DPNP_VERSION 0.5.0)
+# set(DPNP_VERSION 0.5.1)
 # set(DPNP_API_VERSION 0.5)
 
 # set directory where the custom finders live
@@ -57,6 +57,7 @@ option(DPNP_BACKEND_TESTS "Enable DPNP tests" FALSE)
 message(STATUS "CMAKE_VERSION:                   ${CMAKE_VERSION}")
 message(STATUS "CMAKE_GENERATOR:                 ${CMAKE_GENERATOR}")
 message(STATUS "CMAKE_HOST_SYSTEM_NAME:          ${CMAKE_HOST_SYSTEM_NAME}")
+message(STATUS "========== User controlled variables list ==========")
 message(STATUS "DPNP_ONEAPI_ROOT:                ${DPNP_ONEAPI_ROOT}")
 message(STATUS "DPNP_STATIC_LIB_ENABLE:          ${DPNP_STATIC_LIB_ENABLE}")
 message(STATUS "DPNP_DEBUG_ENABLE:               ${DPNP_DEBUG_ENABLE}")
@@ -65,6 +66,7 @@ message(STATUS "DPNP_INSTALL_STRUCTURED:         ${DPNP_INSTALL_STRUCTURED}")
 message(STATUS "DPNP_SYCL_QUEUE_MGR_ENABLE:      ${DPNP_SYCL_QUEUE_MGR_ENABLE}")
 message(STATUS " |- DPNP_QUEUEMGR_INCLUDE_DIR:   ${DPNP_QUEUEMGR_INCLUDE_DIR}")
 message(STATUS " |- DPNP_QUEUEMGR_LIB_DIR:       ${DPNP_QUEUEMGR_LIB_DIR}")
+message(STATUS "======= End of user controlled variables list ======")
 
 # -----------------------------------------------------------------------------------------------
 # Compiler-specific logic...
@@ -162,6 +164,7 @@ project(dpnp_project
 # Building logic...
 # -----------------------------------------------------------------------------------------------
 set(DPNP_SRC
+    kernels/dpnp_krnl_arraycreation.cpp
     kernels/dpnp_krnl_bitwise.cpp
     kernels/dpnp_krnl_common.cpp
     kernels/dpnp_krnl_elemwise.cpp
 
@@ -38,7 +38,7 @@ PROJECT_NAME           = "DPNP C++ backend kernel library"
 # could be handy for archiving the generated documentation or if some version
 # control system is used.
 
-PROJECT_NUMBER         = 0.5.0
+PROJECT_NUMBER         = 0.5.1
 
 # Using the PROJECT_BRIEF tag one can provide an optional one line description
 # for a project that appears at the top of each page and should give viewer a
 
@@ -42,7 +42,7 @@ int main(int, char**)
 {
     const size_t size = 256;
 
-    dpnp_queue_initialize_c(QueueOptions::CPU_SELECTOR);
+    dpnp_queue_initialize_c();
     std::cout << "SYCL queue is CPU: " << dpnp_queue_is_cpu_c() << std::endl;
 
     int* array1 = (int*)dpnp_memory_alloc_c(size * sizeof(int));
 
@@ -0,0 +1,192 @@
+//*****************************************************************************
+// Copyright (c) 2016-2020, Intel Corporation
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// - Redistributions of source code must retain the above copyright notice,
+//   this list of conditions and the following disclaimer.
+// - Redistributions in binary form must reproduce the above copyright notice,
+//   this list of conditions and the following disclaimer in the documentation
+//   and/or other materials provided with the distribution.
+//
+// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
+// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
+// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
+// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
+// THE POSSIBILITY OF SUCH DAMAGE.
+//*****************************************************************************
+
+/**
+ * Example BS.
+ *
+ * This example shows simple usage of the DPNP C++ Backend library
+ * to compute Black-Scholes put option prices, mirroring the Python version.
+ *
+ * Possible compile line:
+ * clang++ -g -fPIC dpnp/backend/examples/example_bs.cpp -Idpnp -Idpnp/backend/include -Ldpnp -Wl,-rpath='$ORIGIN'/dpnp -ldpnp_backend_c -o example_bs
+ *
+ */
+
+#include <iostream>
+#include <cmath>
+
+#include "dpnp_iface.hpp"
+
+/**
+ * Computes Black-Scholes put prices element-wise with DPNP backend kernels.
+ *
+ * Python equivalent of the sequence below:
+ *   d1      = (np.log(S/K) + r_sigma_sigma_2*T) / (sigmas*np.sqrt(T))
+ *   d2      = d1 - sigmas*np.sqrt(T)
+ *   cdf_d1  = (ones + np.erf(d1 / sqrt2)) / twos
+ *   cdf_d2  = (ones + np.erf(d2 / sqrt2)) / twos
+ *   bs_call = S*cdf_d1 - K*np.exp(nrs*T)*cdf_d2
+ *   bs_put  = K*np.exp(nrs*T) - S + bs_call
+ *
+ * Every array argument is read as `size` doubles and none is modified.
+ *
+ * @param [in] S, K, T          Input arrays used as S, K and T in the formulas above.
+ * @param [in] sigmas           Array used as the `sigmas` factor.
+ * @param [in] r_sigma_sigma_2  Array multiplied by T in the numerator of d1.
+ * @param [in] nrs              Array multiplied by T inside np.exp().
+ * @param [in] sqrt2            Divisor applied to d1/d2 before np.erf().
+ * @param [in] ones             Array added to the erf() results.
+ * @param [in] twos             Divisor applied to (ones + erf()).
+ * @param [in] size             Number of elements in every array.
+ *
+ * @return Array of `size` doubles obtained from dpnp_memory_alloc_c(); the caller
+ *         releases it with dpnp_memory_free_c().
+ */
+double* black_scholes_put(double* S, double* K, double* T, double* sigmas, double* r_sigma_sigma_2,
+                          double* nrs, double* sqrt2, double* ones, double* twos, const size_t size)
+{
+    double* d1 = (double*)dpnp_memory_alloc_c(size * sizeof(double));
+    dpnp_divide_c<double, double, double>(S, K, d1, size); // S/K
+    dpnp_log_c<double, double>(d1, d1, size);              // np.log(S/K)
+
+    // bs_put serves as scratch space until the final result is written into it.
+    double* bs_put = (double*)dpnp_memory_alloc_c(size * sizeof(double));
+    dpnp_multiply_c<double, double, double>(r_sigma_sigma_2, T, bs_put, size); // r_sigma_sigma_2*T
+    dpnp_add_c<double, double, double>(d1, bs_put, d1, size); // np.log(S/K) + r_sigma_sigma_2*T
+
+    dpnp_sqrt_c<double, double>(T, bs_put, size);                          // np.sqrt(T)
+    dpnp_multiply_c<double, double, double>(sigmas, bs_put, bs_put, size); // sigmas*np.sqrt(T)
+
+    // (np.log(S/K) + r_sigma_sigma_2*T) / (sigmas*np.sqrt(T))
+    dpnp_divide_c<double, double, double>(d1, bs_put, d1, size);
+
+    // bs_put still holds sigmas*np.sqrt(T) (the divide above only wrote d1),
+    // so it is reused here instead of being recomputed.
+    double* d2 = (double*)dpnp_memory_alloc_c(size * sizeof(double));
+    dpnp_subtract_c<double, double, double>(d1, bs_put, d2, size); // d1 - sigmas*np.sqrt(T)
+
+    double* cdf_d1 = (double*)dpnp_memory_alloc_c(size * sizeof(double));
+    dpnp_divide_c<double, double, double>(d1, sqrt2, cdf_d1, size);   // d1 / sqrt2
+    dpnp_erf_c<double>(cdf_d1, cdf_d1, size);                         // np.erf(d1 / sqrt2)
+    dpnp_add_c<double, double, double>(ones, cdf_d1, cdf_d1, size);   // ones + np.erf(d1 / sqrt2)
+    dpnp_divide_c<double, double, double>(cdf_d1, twos, cdf_d1, size); // (ones + np.erf(d1 / sqrt2)) / twos
+    dpnp_memory_free_c(d1);
+
+    double* cdf_d2 = (double*)dpnp_memory_alloc_c(size * sizeof(double));
+    dpnp_divide_c<double, double, double>(d2, sqrt2, cdf_d2, size);   // d2 / sqrt2
+    dpnp_erf_c<double>(cdf_d2, cdf_d2, size);                         // np.erf(d2 / sqrt2)
+    dpnp_add_c<double, double, double>(ones, cdf_d2, cdf_d2, size);   // ones + np.erf(d2 / sqrt2)
+    dpnp_divide_c<double, double, double>(cdf_d2, twos, cdf_d2, size); // (ones + np.erf(d2 / sqrt2)) / twos
+    dpnp_memory_free_c(d2);
+
+    double* bs_call = (double*)dpnp_memory_alloc_c(size * sizeof(double));
+    dpnp_multiply_c<double, double, double>(S, cdf_d1, bs_call, size); // S*cdf_d1
+    dpnp_memory_free_c(cdf_d1);
+
+    dpnp_multiply_c<double, double, double>(nrs, T, bs_put, size);    // nrs*T
+    dpnp_exp_c<double, double>(bs_put, bs_put, size);                 // np.exp(nrs*T)
+    dpnp_multiply_c<double, double, double>(K, bs_put, bs_put, size); // K*np.exp(nrs*T)
+
+    // K*np.exp(nrs*T)*cdf_d2
+    dpnp_multiply_c<double, double, double>(bs_put, cdf_d2, bs_put, size);
+    dpnp_memory_free_c(cdf_d2);
+
+    // S*cdf_d1 - K*np.exp(nrs*T)*cdf_d2
+    dpnp_subtract_c<double, double, double>(bs_call, bs_put, bs_call, size);
+
+    // bs_put was overwritten with the cdf_d2 product above, so K*np.exp(nrs*T)
+    // has to be rebuilt before forming the put price.
+    dpnp_multiply_c<double, double, double>(nrs, T, bs_put, size);     // nrs*T
+    dpnp_exp_c<double, double>(bs_put, bs_put, size);                  // np.exp(nrs*T)
+    dpnp_multiply_c<double, double, double>(K, bs_put, bs_put, size);  // K*np.exp(nrs*T)
+    dpnp_subtract_c<double, double, double>(bs_put, S, bs_put, size);  // K*np.exp(nrs*T) - S
+    dpnp_add_c<double, double, double>(bs_put, bs_call, bs_put, size); // K*np.exp(nrs*T) - S + bs_call
+    dpnp_memory_free_c(bs_call);
+
+    return bs_put;
+}
+
+/**
+ * Example driver: fills S, K and T with uniform random values, builds the
+ * constant arrays black_scholes_put() expects, prints the first ten resulting
+ * put prices and releases every buffer obtained from dpnp_memory_alloc_c().
+ */
+int main(int, char**)
+{
+    const size_t SIZE = 256;
+
+    const size_t SEED = 7777777;
+    const long SL = 10, SH = 50;
+    const long KL = 10, KH = 50;
+    const long TL = 1,  TH = 2;
+    const double RISK_FREE = 0.1;
+    const double VOLATILITY = 0.2;
+
+    dpnp_queue_initialize_c(QueueOptions::GPU_SELECTOR);
+    std::cout << "SYCL queue is CPU: " << dpnp_queue_is_cpu_c() << std::endl;
+
+    double* S = (double*)dpnp_memory_alloc_c(SIZE * sizeof(double));
+    double* K = (double*)dpnp_memory_alloc_c(SIZE * sizeof(double));
+    double* T = (double*)dpnp_memory_alloc_c(SIZE * sizeof(double));
+
+    dpnp_rng_srand_c(SEED);
+    dpnp_rng_uniform_c<double>(S, SL, SH, SIZE);  // np.random.uniform(SL, SH, SIZE)
+    dpnp_rng_uniform_c<double>(K, KL, KH, SIZE);  // np.random.uniform(KL, KH, SIZE)
+    dpnp_rng_uniform_c<double>(T, TL, TH, SIZE);  // np.random.uniform(TL, TH, SIZE)
+
+    // One-element source buffers for dpnp_full_c(). No separate buffer holding
+    // the bare risk-free rate is needed: it only enters through rss2 and nr.
+    double* sigma = (double*)dpnp_memory_alloc_c(1 * sizeof(double));
+    sigma[0] = VOLATILITY;
+
+    double* rss2 = (double*)dpnp_memory_alloc_c(1 * sizeof(double));
+    rss2[0] = RISK_FREE + VOLATILITY*VOLATILITY/2.;
+
+    double* nr = (double*)dpnp_memory_alloc_c(1 * sizeof(double));
+    nr[0] = -RISK_FREE;
+
+    double* sq2 = (double*)dpnp_memory_alloc_c(1 * sizeof(double));
+    sq2[0] = std::sqrt(2.);
+
+    double* one = (double*)dpnp_memory_alloc_c(1 * sizeof(double));
+    one[0] = 1.;
+
+    double* two = (double*)dpnp_memory_alloc_c(1 * sizeof(double));
+    two[0] = 2.;
+
+    double* sigmas = (double*)dpnp_memory_alloc_c(SIZE * sizeof(double));
+    double* r_sigma_sigma_2 = (double*)dpnp_memory_alloc_c(SIZE * sizeof(double));
+    double* nrs = (double*)dpnp_memory_alloc_c(SIZE * sizeof(double));
+    double* sqrt2 = (double*)dpnp_memory_alloc_c(SIZE * sizeof(double));
+    double* ones = (double*)dpnp_memory_alloc_c(SIZE * sizeof(double));
+    double* twos = (double*)dpnp_memory_alloc_c(SIZE * sizeof(double));
+
+    dpnp_full_c<double>(sigma, sigmas, SIZE);          // np.full((SIZE,), sigma, dtype=DTYPE)
+    dpnp_full_c<double>(rss2, r_sigma_sigma_2, SIZE);  // np.full((SIZE,), r + sigma*sigma/2., dtype=DTYPE)
+    dpnp_full_c<double>(nr, nrs, SIZE);                // np.full((SIZE,), -r, dtype=DTYPE)
+    dpnp_full_c<double>(sq2, sqrt2, SIZE);             // np.full((SIZE,), np.sqrt(2), dtype=DTYPE)
+    dpnp_full_c<double>(one, ones, SIZE);              // np.full((SIZE,), 1, dtype=DTYPE)
+    dpnp_full_c<double>(two, twos, SIZE);              // np.full((SIZE,), 2, dtype=DTYPE)
+
+    // The one-element sources are no longer needed once the full arrays exist.
+    dpnp_memory_free_c(one);
+    dpnp_memory_free_c(two);
+    dpnp_memory_free_c(sq2);
+    dpnp_memory_free_c(nr);
+    dpnp_memory_free_c(rss2);
+    dpnp_memory_free_c(sigma);
+
+    double* bs_put = black_scholes_put(S, K, T, sigmas, r_sigma_sigma_2, nrs, sqrt2, ones, twos, SIZE);
+
+    // Print only the first ten results as a sample of the output.
+    std::cout << std::endl;
+    for (size_t i = 0; i < 10; ++i)
+    {
+        std::cout << bs_put[i] << ", ";
+    }
+    std::cout << std::endl;
+
+    dpnp_memory_free_c(bs_put);
+
+    dpnp_memory_free_c(twos);
+    dpnp_memory_free_c(ones);
+    dpnp_memory_free_c(sqrt2);
+    dpnp_memory_free_c(nrs);
+    dpnp_memory_free_c(r_sigma_sigma_2);
+    dpnp_memory_free_c(sigmas);
+
+    dpnp_memory_free_c(T);
+    dpnp_memory_free_c(K);
+    dpnp_memory_free_c(S);
+
+    return 0;
+}
@@ -68,7 +68,8 @@
 enum class QueueOptions : uint32_t
 {
     CPU_SELECTOR, /**< CPU side execution mode */
-    GPU_SELECTOR  /**< Intel GPU side execution mode */
+    GPU_SELECTOR, /**< Intel GPU side execution mode */
+    AUTO_SELECTOR /**< Automatic selection based on environment variable with @ref CPU_SELECTOR default */
 };
 
 /**
@@ -77,9 +78,9 @@ enum class QueueOptions : uint32_t
  *
  * Global SYCL queue initialization.
  *
- * @param [in]  selector       Select type @ref QueueOptions of the SYCL queue.
+ * @param [in]  selector       Select type @ref QueueOptions of the SYCL queue. Default @ref AUTO_SELECTOR
  */
-INP_DLLEXPORT void dpnp_queue_initialize_c(QueueOptions selector);
+INP_DLLEXPORT void dpnp_queue_initialize_c(QueueOptions selector = QueueOptions::AUTO_SELECTOR);
 
 /**
  * @ingroup BACKEND_API
@@ -118,6 +119,17 @@ void dpnp_memory_memcpy_c(void* dst, const void* src, size_t size_in_bytes);
 template <typename _DataType>
 INP_DLLEXPORT void dpnp_arange_c(size_t start, size_t step, void* result1, size_t size);
 
+/**
+ * @ingroup BACKEND_API
+ * @brief Implementation of full function
+ *
+ * @param [in]  array_in  Input one-element array.
+ * @param [out] result    Output array.
+ * @param [in]  size      Number of elements in the output array.
+ */
+template <typename _DataType>
+INP_DLLEXPORT void dpnp_full_c(void* array_in, void* result, const size_t size);
+
 /**
  * @ingroup BACKEND_API
  * @brief Matrix multiplication.
@@ -169,6 +181,30 @@ INP_DLLEXPORT void dpnp_dot_c(void* array1, void* array2, void* result1, size_t
 template <typename _DataType_input1, typename _DataType_input2, typename _DataType_output>
 INP_DLLEXPORT void dpnp_cross_c(void* array1_in, void* array2_in, void* result1, size_t size);
 
+/**
+ * @ingroup BACKEND_API
+ * @brief Custom implementation of cumprod function
+ *
+ * @param [in]  array1_in  Input array.
+ * @param [out] result1    Output array.
+ * @param [in]  size       Number of elements in input arrays.
+ *
+ */
+template <typename _DataType_input, typename _DataType_output>
+INP_DLLEXPORT void dpnp_cumprod_c(void* array1_in, void* result1, size_t size);
+
+/**
+ * @ingroup BACKEND_API
+ * @brief Custom implementation of cumsum function
+ *
+ * @param [in]  array1_in  Input array.
+ * @param [out] result1    Output array.
+ * @param [in]  size       Number of elements in input arrays.
+ *
+ */
+template <typename _DataType_input, typename _DataType_output>
+INP_DLLEXPORT void dpnp_cumsum_c(void* array1_in, void* result1, size_t size);
+
 /**
  * @ingroup BACKEND_API
  * @brief Sum of array elements
@@ -284,6 +320,17 @@ INP_DLLEXPORT void dpnp_cov_c(void* array1_in, void* result1, size_t nrows, size
 template <typename _DataType>
 INP_DLLEXPORT void dpnp_det_c(void* array1_in, void* result1, size_t* shape, size_t ndim);
 
+/**
+ * @ingroup BACKEND_API
+ * @brief Implementation of a function that creates an array filled with a given value
+ *
+ * @param [out] result1  Output array.
+ * @param [in]  value    Pointer to the value used to fill the array.
+ * @param [in]  size     Number of elements in array.
+ */
+template <typename _DataType>
+INP_DLLEXPORT void dpnp_initval_c(void* result1, void* value, size_t size);
+
 /**
  * @ingroup BACKEND_API
  * @brief math library implementation of inv function
@@ -411,11 +458,11 @@ INP_DLLEXPORT void dpnp_std_c(
  * @brief math library implementation of take function
  *
  * @param [in]  array   Input array with data.
- * @param [in]  array   Input array with indices.
- * @param [out] result  Output array with indeces.
+ * @param [in]  indices Input array with indices.
+ * @param [out] result  Output array.
  * @param [in]  size    Number of elements in the input array.
  */
-template <typename _DataType>
+template <typename _DataType, typename _IndecesType>
 INP_DLLEXPORT void dpnp_take_c(void* array, void* indices, void* result, size_t size);
 
 /**
@@ -513,14 +560,16 @@ INP_DLLEXPORT void dpnp_remainder_c(void* array1_in, void* array2_in, void* resu
  * @param [in]  input_shape  Input shape.
  * @param [in]  result_shape Output shape.
  * @param [in]  permute_axes Order of axis by it's id as it should be presented in output.
+ * @param [in]  ndim         Number of elements in shapes and axes.
  * @param [out] result1      Output array.
  * @param [in]  size         Number of elements in input arrays.
  */
 template <typename _DataType>
 INP_DLLEXPORT void dpnp_elemwise_transpose_c(void* array1_in,
-                                             const std::vector<long>& input_shape,
-                                             const std::vector<long>& result_shape,
-                                             const std::vector<long>& permute_axes,
+                                             const size_t* input_shape,
+                                             const size_t* result_shape,
+                                             const size_t* permute_axes,
+                                             size_t ndim,
                                              void* result1,
                                              size_t size);
Original file line number	Diff line number	Diff line change
`@@ -42,7 +42,7 @@ int main(int, char**)`
`42`	`42`	`{`
`43`	`43`	`const size_t size = 256;`
`44`	`44`
`45`		`- dpnp_queue_initialize_c(QueueOptions::CPU_SELECTOR);`
	`45`	`+ dpnp_queue_initialize_c();`
`46`	`46`	`std::cout << "SYCL queue is CPU: " << dpnp_queue_is_cpu_c() << std::endl;`
`47`	`47`
`48`	`48`	`int* array1 = (int*)dpnp_memory_alloc_c(size * sizeof(int));`