feat: add dispatcher

kgryte · saurabhraghuvanshii · commit cbbfdd72914d · 2025-01-19T16:07:20.000+05:30
---
type: pre_commit_static_analysis_report
description: Results of running static analysis checks when committing changes.
report:
  - task: lint_filenames
    status: passed
  - task: lint_editorconfig
    status: passed
  - task: lint_markdown
    status: na
  - task: lint_package_json
    status: na
  - task: lint_repl_help
    status: na
  - task: lint_javascript_src
    status: na
  - task: lint_javascript_cli
    status: na
  - task: lint_javascript_examples
    status: na
  - task: lint_javascript_tests
    status: na
  - task: lint_javascript_benchmarks
    status: na
  - task: lint_python
    status: na
  - task: lint_r
    status: na
  - task: lint_c_src
    status: passed
  - task: lint_c_examples
    status: na
  - task: lint_c_benchmarks
    status: na
  - task: lint_c_tests_fixtures
    status: na
  - task: lint_shell
    status: na
  - task: lint_typescript_declarations
    status: na
  - task: lint_typescript_tests
    status: na
  - task: lint_license_headers
    status: passed
---
diff --git a/lib/node_modules/@stdlib/ndarray/base/unary-accumulate/src/dispatch.c b/lib/node_modules/@stdlib/ndarray/base/unary-accumulate/src/dispatch.c
@@ -0,0 +1,344 @@
+/**
+* @license Apache-2.0
+*
+* Copyright (c) 2025 The Stdlib Authors.
+*
+* Licensed under the Apache License, Version 2.0 (the "License");
+* you may not use this file except in compliance with the License.
+* You may obtain a copy of the License at
+*
+*    http://www.apache.org/licenses/LICENSE-2.0
+*
+* Unless required by applicable law or agreed to in writing, software
+* distributed under the License is distributed on an "AS IS" BASIS,
+* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+* See the License for the specific language governing permissions and
+* limitations under the License.
+*/
+
+#include "stdlib/ndarray/base/unary-accumulate/dispatch_object.h"
+#include "stdlib/ndarray/base/unary-accumulate/typedefs.h"
+#include "stdlib/ndarray/base/iteration_order.h"
+#include "stdlib/ndarray/base/bytes_per_element.h"
+#include "stdlib/ndarray/ctor.h"
+#include <stdint.h>
+#include <stddef.h>
+
+/**
+* Performs a reduction over elements in n-dimensional input ndarray having `ndims-1` singleton dimensions.
+*
+* ## Notes
+*
+* -   If able to successfully perform a reduction, the function returns `0`; otherwise, the function returns an error code.
+*
+* @param f     ndarray function
+* @param x1    input ndarray
+* @param x2    initial value ndarray
+* @param x3    output ndarray
+* @param i     index of the non-singleton dimension
+* @param fcn   callback
+* @return      status code
+*/
+static int8_t stdlib_ndarray_unary_accumulate_1d_squeeze( const ndarrayUnaryAccumulateFcn f, const struct ndarray *x1, const struct ndarray *x2, struct ndarray *x3, const int64_t i, void *fcn ) {
+	int64_t sh[] = { stdlib_ndarray_shape( x1 )[ i ] };
+
+	// Shallow copy and reshape the array...
+	int64_t sx1[] = { stdlib_ndarray_strides( x1 )[ i ] };
+	struct ndarray *x1c = stdlib_ndarray_allocate(
+		stdlib_ndarray_dtype( x1 ),
+		stdlib_ndarray_data( x1 ),
+		1,
+		sh,
+		sx1,
+		stdlib_ndarray_offset( x1 ),
+		stdlib_ndarray_order( x1 ),
+		stdlib_ndarray_index_mode( x1 ),
+		stdlib_ndarray_nsubmodes( x1 ),
+		stdlib_ndarray_submodes( x1 )
+	);
+	if ( x1c == NULL ) {
+		return -1;
+	}
+	// Perform the reduction:
+	struct ndarray *arrays[] = { x1c, x2, x3 };
+	int8_t status = f( arrays, fcn );
+
+	// Free allocated memory:
+	stdlib_ndarray_free( x1c );
+
+	return status;
+}
+
+/**
+* Performs a reduction over elements in a flattened n-dimensional input ndarray.
+*
+* ## Notes
+*
+* -   If able to successfully perform a reduction, the function returns `0`; otherwise, the function returns an error code.
+*
+* @param f     ndarray function
+* @param N     number of elements
+* @param x1    input ndarray
+* @param s1    input ndarray stride length
+* @param x2    initial value ndarray
+* @param x3    output ndarray
+* @param fcn   callback
+* @return      status code
+*/
+static int8_t stdlib_ndarray_unary_accumulate_1d_flatten( const ndarrayUnaryAccumulateFcn f, const int64_t N, const struct ndarray *x1, const int64_t s1, const struct ndarray *x2, struct ndarray *x3, void *fcn ) {
+	// Define the (flattened) strided array shape:
+	int64_t sh[] = { N };
+
+	// Shallow copy and reshape the array...
+	int64_t sx1[] = { s1 };
+	struct ndarray *x1c = stdlib_ndarray_allocate(
+		stdlib_ndarray_dtype( x1 ),
+		stdlib_ndarray_data( x1 ),
+		1,
+		sh,
+		sx1,
+		stdlib_ndarray_offset( x1 ),
+		stdlib_ndarray_order( x1 ),
+		stdlib_ndarray_index_mode( x1 ),
+		stdlib_ndarray_nsubmodes( x1 ),
+		stdlib_ndarray_submodes( x1 )
+	);
+	if ( x1c == NULL ) {
+		return -1;
+	}
+	// Perform the reduction:
+	struct ndarray *arrays[] = { x1c, x2, x3 };
+	int8_t status = f( arrays, fcn );
+
+	// Free allocated memory:
+	stdlib_ndarray_free( x1c );
+
+	return status;
+}
+
+/**
+* Dispatches to an ndarray function according to the dimensionality of provided ndarray arguments.
+*
+* ## Notes
+*
+* -   If able to successfully dispatch, the function returns `0`; otherwise, the function returns an error code.
+*
+* @param obj      object comprised of dispatch tables containing ndarray functions
+* @param arrays   array whose first element is a pointer to an input ndarray, second element is a pointer to a zero-dimensional initial value ndarray, and last element is a pointer to a zero-dimensional output ndarray
+* @param fcn      callback
+* @return         status code
+*
+* @example
+* #include "stdlib/ndarray/base/unary-accumulate/dispatch.h"
+* #include "stdlib/ndarray/base/unary-accumulate/dispatch_object.h"
+* #include "stdlib/ndarray/base/unary-accumulate/typedefs.h"
+* #include "stdlib/ndarray/base/unary-accumulate/bb_b.h"
+* #include "stdlib/ndarray/ctor.h"
+* #include <stdint.h>
+* #include <stdlib.h>
+* #include <stdio.h>
+*
+* // Define a list of ndarray functions:
+* ndarrayUnaryAccumulateFcn functions[] = {
+*     stdlib_ndarray_accumulate_bb_b_0d,
+*     stdlib_ndarray_accumulate_bb_b_1d,
+*     stdlib_ndarray_accumulate_bb_b_2d,
+*     stdlib_ndarray_accumulate_bb_b_3d,
+*     stdlib_ndarray_accumulate_bb_b_4d,
+*     stdlib_ndarray_accumulate_bb_b_5d,
+*     stdlib_ndarray_accumulate_bb_b_6d,
+*     stdlib_ndarray_accumulate_bb_b_7d,
+*     stdlib_ndarray_accumulate_bb_b_8d,
+*     stdlib_ndarray_accumulate_bb_b_9d,
+*     stdlib_ndarray_accumulate_bb_b_10d
+*     stdlib_ndarray_accumulate_bb_b_nd
+* };
+*
+* // Define a list of ndarray functions using loop blocking:
+* ndarrayUnaryAccumulateFcn blocked_functions[] = {
+*     stdlib_ndarray_accumulate_bb_b_2d_blocked,
+*     stdlib_ndarray_accumulate_bb_b_3d_blocked,
+*     stdlib_ndarray_accumulate_bb_b_4d_blocked,
+*     stdlib_ndarray_accumulate_bb_b_5d_blocked,
+*     stdlib_ndarray_accumulate_bb_b_6d_blocked,
+*     stdlib_ndarray_accumulate_bb_b_7d_blocked,
+*     stdlib_ndarray_accumulate_bb_b_8d_blocked,
+*     stdlib_ndarray_accumulate_bb_b_9d_blocked,
+*     stdlib_ndarray_accumulate_bb_b_10d_blocked
+* };
+*
+* // Create a function dispatch object:
+* struct ndarrayUnaryAccumulateDispatchObject obj = {
+*     // Array containing ndarray functions:
+*     functions,
+*
+*     // Number of ndarray functions:
+*     12,
+*
+*     // Array containing ndarray functions using loop blocking:
+*     blocked_functions,
+*
+*     // Number of ndarray functions using loop blocking:
+*     9
+* }
+*
+* // Define a function which performs dispatch:
+* int8_t stdlib_ndarray_accumulate_bb_b( struct ndarray *arrays[], void *fcn ) {
+*     return stdlib_ndarray_unary_accumulate_dispatch( &obj, arrays, fcn );
+* }
+*
+* // ...
+*
+* // Create ndarrays...
+* struct ndarray *x = stdlib_ndarray_allocate( ... );
+* if ( x == NULL ) {
+*     fprintf( stderr, "Error allocating memory.\n" );
+*     exit( EXIT_FAILURE );
+* }
+*
+* struct ndarray *initial = stdlib_ndarray_allocate( ... );
+* if ( y == NULL ) {
+*     fprintf( stderr, "Error allocating memory.\n" );
+*     exit( EXIT_FAILURE );
+* }
+*
+* struct ndarray *out = stdlib_ndarray_allocate( ... );
+* if ( y == NULL ) {
+*     fprintf( stderr, "Error allocating memory.\n" );
+*     exit( EXIT_FAILURE );
+* }
+*
+* // ...
+*
+* // Define a callback:
+* uint8_t add( const uint8_t acc, const uint8_t x ) {
+*     return acc + x;
+* }
+*
+* // Apply the callback:
+* struct ndarray *arrays[] = { x, initial, out };
+* int8_t status = stdlib_ndarray_accumulate_bb_b( arrays, (void *)add );
+* if ( status != 0 ) {
+*     fprintf( stderr, "Error during computation.\n" );
+*     exit( EXIT_FAILURE );
+* }
+*/
+int8_t stdlib_ndarray_unary_accumulate_dispatch( const struct ndarrayUnaryAccumulateDispatchObject *obj, struct ndarray *arrays[], void *fcn ) {
+	const int64_t *sh1;
+	struct ndarray *x1;
+	struct ndarray *x2;
+	struct ndarray *x3;
+	int8_t status;
+	int64_t ndims;
+	int64_t mab1;
+	int64_t mib1;
+	int64_t *s1;
+	int64_t len;
+	int64_t bp1;
+	int8_t io1;
+	int64_t ns;
+	int64_t s;
+	int64_t d;
+	int64_t i;
+
+	// Unpack the arrays:
+	x1 = arrays[ 0 ];
+	x2 = arrays[ 1 ];
+	x3 = arrays[ 3 ];
+
+	ndims = stdlib_ndarray_ndims( x1 );
+
+	// Determine whether we can avoid iteration altogether...
+	if ( ndims == 0 ) {
+		obj->functions[ 0 ]( arrays, fcn );
+		return 0;
+	}
+	sh1 = stdlib_ndarray_shape( x1 );
+
+	// Determine the number of elements and the number of singleton dimensions...
+	len = 1; // number of elements
+	ns = 0;  // number of singleton dimensions
+	for ( i = 0; i < ndims; i++ ) {
+		d = sh1[ i ];
+
+		// Note that, if one of the dimensions is `0`, the length will be `0`...
+		len *= d;
+
+		// Check whether the current dimension is a singleton dimension...
+		if ( d == 1 ) {
+			ns += 1;
+		}
+	}
+	// Check whether we were provided an empty ndarray...
+	if ( len == 0 ) {
+		return 0;
+	}
+	// Determine whether the ndarray is one-dimensional and thus readily translates to a one-dimensional strided array...
+	if ( ndims == 1 ) {
+		obj->functions[ 1 ]( arrays, fcn );
+		return 0;
+	}
+	// Determine whether the ndarray has only **one** non-singleton dimension (e.g., ndims=4, shape=[10,1,1,1]) so that we can treat an ndarray as being equivalent to a one-dimensional strided array...
+	if ( ns == ndims-1 ) {
+		// Get the index of the non-singleton dimension...
+		for ( i = 0; i < ndims; i++ ) {
+			if ( sh1[ i ] != 1 ) {
+				break;
+			}
+		}
+		// Remove the singleton dimensions and apply the callback function...
+		status = stdlib_ndarray_unary_accumulate_1d_squeeze( obj->functions[ 1 ], x1, x2, x3, i, fcn );
+		if ( status == 0 ) {
+			return 0;
+		}
+		// If we failed, this is probably due to failed memory allocation, so fall through and try again...
+	}
+	s1 = stdlib_ndarray_strides( x1 );
+	io1 = stdlib_ndarray_iteration_order( ndims, s1 ); // +/-1
+
+	// Determine whether we can avoid blocked iteration...
+	if ( io1 != 0 ) {
+		// Determine the minimum and maximum linear byte indices which are accessible by the array view:
+		mib1 = stdlib_ndarray_offset( x1 ); // byte offset
+		mab1 = mib1;
+		for ( i = 0; i < ndims; i++ ) {
+			s = s1[ i ]; // units: bytes
+			if ( s > 0 ) {
+				mab1 += s * ( sh1[i]-1 );
+			} else if ( s < 0 ) {
+				mib1 += s * ( sh1[i]-1 ); // decrements
+			}
+		}
+		bp1 = stdlib_ndarray_bytes_per_element( stdlib_ndarray_dtype( x1 ) );
+
+		// Determine whether we can ignore shape (and strides) and treat the ndarray as a linear one-dimensional strided array...
+		if ( ( len*bp1 ) == ( mab1-mib1+bp1 ) ) {
+			// Note: the above is equivalent to @stdlib/ndarray/base/assert/is-contiguous, but in-lined so we can retain computed values...
+			status = stdlib_ndarray_unary_accumulate_1d_flatten( obj->functions[ 1 ], len, x1, io1*bp1, x2, x3, fcn );
+			if ( status == 0 ) {
+				return 0;
+			}
+			// If we failed, this is probably due to failed memory allocation, so fall through and try again...
+		}
+		// The ndarray is non-contiguous, so we cannot directly use one-dimensional array functionality...
+
+		// Determine whether we can use simple nested loops...
+		if ( ndims < (obj->nfunctions) ) {
+			// So long as iteration always moves in the same direction (i.e., no mixed sign strides), we can leverage cache-optimal (i.e., normal) nested loops without resorting to blocked iteration...
+			obj->functions[ ndims ]( arrays, fcn );
+			return 0;
+		}
+		// Fall-through to blocked iteration...
+	}
+	// At this point, we're either dealing with a non-contiguous n-dimensional array or a high dimensional n-dimensional array, so our only hope is that we can still perform blocked iteration...
+
+	// Determine whether we can perform blocked iteration...
+	if ( ndims <= (obj->nblockedfunctions)+1 ) {
+		obj->blocked_functions[ ndims-2 ]( arrays, fcn );
+		return 0;
+	}
+	// Fall-through to linear view iteration without regard for how data is stored in memory (i.e., take the slow path)...
+	obj->functions[ (obj->nfunctions)-1 ]( arrays, fcn );
+
+	return 0;
+}