Skip to content

Commit 0229b71

Browse files
committed
feat: add remaining kernels
--- type: pre_commit_static_analysis_report description: Results of running static analysis checks when committing changes. report: - task: lint_filenames status: passed - task: lint_editorconfig status: passed - task: lint_markdown status: na - task: lint_package_json status: na - task: lint_repl_help status: na - task: lint_javascript_src status: passed - task: lint_javascript_cli status: na - task: lint_javascript_examples status: na - task: lint_javascript_tests status: na - task: lint_javascript_benchmarks status: na - task: lint_python status: na - task: lint_r status: na - task: lint_c_src status: na - task: lint_c_examples status: na - task: lint_c_benchmarks status: na - task: lint_c_tests_fixtures status: na - task: lint_shell status: na - task: lint_typescript_declarations status: na - task: lint_typescript_tests status: na - task: lint_license_headers status: passed ---
1 parent 27ddd92 commit 0229b71

File tree

12 files changed

+4242
-0
lines changed

12 files changed

+4242
-0
lines changed
Lines changed: 306 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,306 @@
1+
/**
2+
* @license Apache-2.0
3+
*
4+
* Copyright (c) 2025 The Stdlib Authors.
5+
*
6+
* Licensed under the Apache License, Version 2.0 (the "License");
7+
* you may not use this file except in compliance with the License.
8+
* You may obtain a copy of the License at
9+
*
10+
* http://www.apache.org/licenses/LICENSE-2.0
11+
*
12+
* Unless required by applicable law or agreed to in writing, software
13+
* distributed under the License is distributed on an "AS IS" BASIS,
14+
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15+
* See the License for the specific language governing permissions and
16+
* limitations under the License.
17+
*/
18+
19+
/* eslint-disable max-len, max-params, max-depth, max-statements */
20+
21+
'use strict';
22+
23+
// MODULES //
24+
25+
var copyIndexed = require( '@stdlib/array/base/copy-indexed' );
26+
var incrementOffsets = require( './increment_offsets.js' );
27+
var setViewOffsets = require( './set_view_offsets.js' );
28+
var offsets = require( './offsets.js' );
29+
var wrap = require( './callback_wrapper.js' );
30+
31+
32+
// MAIN //
33+
34+
/**
35+
* Performs a reduction over an input ndarray according to a callback function and assigns results to a provided output ndarray.
36+
*
37+
* @private
38+
* @param {Function} fcn - wrapper for a one-dimensional strided array reduction function
39+
* @param {Array<Object>} arrays - ndarrays
40+
* @param {Function} strategy - input ndarray reshape strategy
41+
* @param {Array<Object>} views - initialized ndarray-like objects representing sub-array views
42+
* @param {NonNegativeIntegerArray} ibuf - workspace for storing iteration indices
43+
* @param {NonNegativeIntegerArray} ldims - list of loop dimensions
44+
* @param {NonNegativeIntegerArray} cdims - list of "core" dimensions
45+
* @param {IntegerArray} strides - loop dimension strides for the input ndarray
46+
* @param {boolean} isRowMajor - boolean indicating whether the input ndarray is row-major
47+
* @param {Options} opts - function options
48+
* @param {boolean} hasOpts - boolean indicating whether to pass an options argument to a reduction function
49+
* @param {Function} clbk - callback function
50+
* @param {*} thisArg - callback execution context
51+
* @returns {void}
52+
*
53+
* @example
54+
* var Float64Array = require( '@stdlib/array/float64' );
55+
* var ndarray2array = require( '@stdlib/ndarray/base/to-array' );
56+
* var zeros = require( '@stdlib/array/base/zeros' );
57+
* var maxBy = require( '@stdlib/stats/base/ndarray/max-by' );
58+
*
59+
* function clbk( value ) {
60+
* return value * 2.0;
61+
* }
62+
*
63+
* // Create data buffers:
64+
* var xbuf = new Float64Array( [ 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0, 9.0, 10.0, 11.0, 12.0 ] );
65+
* var ybuf = new Float64Array( [ 0.0, 0.0, 0.0 ] );
66+
*
67+
* // Define the array shapes:
68+
* var xsh = [ 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 2, 2 ];
69+
* var ysh = [ 1, 1, 1, 1, 1, 1, 1, 1, 1, 3 ];
70+
*
71+
* // Define the array strides:
72+
* var sx = [ 12, 12, 12, 12, 12, 12, 12, 12, 12, 4, 2, 1 ];
73+
* var sy = [ 3, 3, 3, 3, 3, 3, 3, 3, 3, 1 ];
74+
*
75+
* // Define the index offsets:
76+
* var ox = 0;
77+
* var oy = 0;
78+
*
79+
* // Create an input ndarray-like object:
80+
* var x = {
81+
* 'dtype': 'float64',
82+
* 'data': xbuf,
83+
* 'shape': xsh,
84+
* 'strides': sx,
85+
* 'offset': ox,
86+
* 'order': 'row-major'
87+
* };
88+
*
89+
* // Create an output ndarray-like object:
90+
* var y = {
91+
* 'dtype': 'float64',
92+
* 'data': ybuf,
93+
* 'shape': ysh,
94+
* 'strides': sy,
95+
* 'offset': oy,
96+
* 'order': 'row-major'
97+
* };
98+
*
99+
* // Initialize ndarray-like objects representing sub-array views:
100+
* var views = [
101+
* {
102+
* 'dtype': x.dtype,
103+
* 'data': x.data,
104+
* 'shape': [ 2, 2 ],
105+
* 'strides': [ 2, 1 ],
106+
* 'offset': x.offset,
107+
* 'order': x.order
108+
* }
109+
* ];
110+
*
111+
* // Define a reshape strategy:
112+
* function strategy( x ) {
113+
* return {
114+
* 'dtype': x.dtype,
115+
* 'data': x.data,
116+
* 'shape': [ 4 ],
117+
* 'strides': [ 1 ],
118+
* 'offset': x.offset,
119+
* 'order': x.order
120+
* };
121+
* }
122+
*
123+
* // Create a workspace array for storing iteration indices:
124+
* var ibuf = zeros( xsh.length );
125+
*
126+
* // Define the loop and core dimensions:
127+
* var ldims = [ 0, 1, 2, 3, 4, 5, 6, 7, 8, 9 ];
128+
* var cdims = [ 10, 11 ];
129+
*
130+
* // Resolve the loop dimension strides for the input array:
131+
* var slx = [ 12, 12, 12, 12, 12, 12, 12, 12, 12, 4 ];
132+
*
133+
* // Perform a reduction:
134+
* unary10d( maxBy, [ x, y ], strategy, views, ibuf, ldims, cdims, slx, true, {}, false, clbk );
135+
*
136+
* var arr = ndarray2array( y.data, y.shape, y.strides, y.offset, y.order );
137+
* // returns [ [ [ [ [ [ [ [ [ [ 8.0, 16.0, 24.0 ] ] ] ] ] ] ] ] ] ]
138+
*/
139+
function unary10d( fcn, arrays, strategy, views, ibuf, ldims, cdims, strides, isRowMajor, opts, hasOpts, clbk, thisArg ) {
	var ybuf;
	var dv0;
	var dv1;
	var dv2;
	var dv3;
	var dv4;
	var dv5;
	var dv6;
	var dv7;
	var dv8;
	var dv9;
	var sh;
	var S0;
	var S1;
	var S2;
	var S3;
	var S4;
	var S5;
	var S6;
	var S7;
	var S8;
	var S9;
	var sv;
	var iv;
	var i0;
	var i1;
	var i2;
	var i3;
	var i4;
	var i5;
	var i6;
	var i7;
	var i8;
	var i9;
	var y;
	var v;
	var i;
	var f;

	// Note on variable naming convention: S#, dv#, i# where # corresponds to the loop number, with `0` being the innermost loop...

	// Resolve the output ndarray and associated shape:
	y = arrays[ 1 ];
	sh = y.shape;

	// Extract loop variables for purposes of loop interchange: dimensions and loop offset (pointer) increments...

	// Note: each `dv#` list holds one increment per ndarray. The first entry is derived from the provided input loop `strides`; the remaining entries are derived from the strides of `arrays[1]`, `arrays[2]`, and so on. For loop `k > 0`, the increment is the stride of loop `k` minus the `S(k-1)` steps already taken along loop `k-1`.
	if ( isRowMajor ) {
		// For row-major ndarrays, the last dimensions have the fastest changing indices...
		S0 = sh[ 9 ];
		S1 = sh[ 8 ];
		S2 = sh[ 7 ];
		S3 = sh[ 6 ];
		S4 = sh[ 5 ];
		S5 = sh[ 4 ];
		S6 = sh[ 3 ];
		S7 = sh[ 2 ];
		S8 = sh[ 1 ];
		S9 = sh[ 0 ];
		dv0 = [ strides[9] ]; // offset increment for innermost loop
		dv1 = [ strides[8] - ( S0*strides[9] ) ];
		dv2 = [ strides[7] - ( S1*strides[8] ) ];
		dv3 = [ strides[6] - ( S2*strides[7] ) ];
		dv4 = [ strides[5] - ( S3*strides[6] ) ];
		dv5 = [ strides[4] - ( S4*strides[5] ) ];
		dv6 = [ strides[3] - ( S5*strides[4] ) ];
		dv7 = [ strides[2] - ( S6*strides[3] ) ];
		dv8 = [ strides[1] - ( S7*strides[2] ) ];
		dv9 = [ strides[0] - ( S8*strides[1] ) ]; // offset increment for outermost loop
		for ( i = 1; i < arrays.length; i++ ) {
			sv = arrays[ i ].strides;
			dv0.push( sv[9] );
			dv1.push( sv[8] - ( S0*sv[9] ) );
			dv2.push( sv[7] - ( S1*sv[8] ) );
			dv3.push( sv[6] - ( S2*sv[7] ) );
			dv4.push( sv[5] - ( S3*sv[6] ) );
			dv5.push( sv[4] - ( S4*sv[5] ) );
			dv6.push( sv[3] - ( S5*sv[4] ) );
			dv7.push( sv[2] - ( S6*sv[3] ) );
			dv8.push( sv[1] - ( S7*sv[2] ) );
			dv9.push( sv[0] - ( S8*sv[1] ) );
		}
	} else { // order === 'column-major'
		// For column-major ndarrays, the first dimensions have the fastest changing indices...
		S0 = sh[ 0 ];
		S1 = sh[ 1 ];
		S2 = sh[ 2 ];
		S3 = sh[ 3 ];
		S4 = sh[ 4 ];
		S5 = sh[ 5 ];
		S6 = sh[ 6 ];
		S7 = sh[ 7 ];
		S8 = sh[ 8 ];
		S9 = sh[ 9 ];
		dv0 = [ strides[0] ]; // offset increment for innermost loop
		dv1 = [ strides[1] - ( S0*strides[0] ) ];
		dv2 = [ strides[2] - ( S1*strides[1] ) ];
		dv3 = [ strides[3] - ( S2*strides[2] ) ];
		dv4 = [ strides[4] - ( S3*strides[3] ) ];
		dv5 = [ strides[5] - ( S4*strides[4] ) ];
		dv6 = [ strides[6] - ( S5*strides[5] ) ];
		dv7 = [ strides[7] - ( S6*strides[6] ) ];
		dv8 = [ strides[8] - ( S7*strides[7] ) ];
		dv9 = [ strides[9] - ( S8*strides[8] ) ]; // offset increment for outermost loop
		for ( i = 1; i < arrays.length; i++ ) {
			sv = arrays[ i ].strides;
			dv0.push( sv[0] );
			dv1.push( sv[1] - ( S0*sv[0] ) );
			dv2.push( sv[2] - ( S1*sv[1] ) );
			dv3.push( sv[3] - ( S2*sv[2] ) );
			dv4.push( sv[4] - ( S3*sv[3] ) );
			dv5.push( sv[5] - ( S4*sv[4] ) );
			dv6.push( sv[6] - ( S5*sv[5] ) );
			dv7.push( sv[7] - ( S6*sv[6] ) );
			dv8.push( sv[8] - ( S7*sv[7] ) );

			// The outermost increment must land in `dv9` (not `dv8`) so that every `dv#` list has exactly one entry per ndarray:
			dv9.push( sv[9] - ( S8*sv[8] ) );
		}
	}
	// Resolve a list of pointers to the first indexed elements in the respective ndarrays:
	iv = offsets( arrays );

	// Shallow copy the list of views to an internal array so that we can update with reshaped views without impacting the original list of views:
	v = copyIndexed( views );

	// Cache a reference to the output ndarray buffer:
	ybuf = y.data;

	// Iterate over the non-reduced ndarray dimensions...
	for ( i9 = 0; i9 < S9; i9++ ) {
		for ( i8 = 0; i8 < S8; i8++ ) {
			for ( i7 = 0; i7 < S7; i7++ ) {
				for ( i6 = 0; i6 < S6; i6++ ) {
					for ( i5 = 0; i5 < S5; i5++ ) {
						for ( i4 = 0; i4 < S4; i4++ ) {
							for ( i3 = 0; i3 < S3; i3++ ) {
								for ( i2 = 0; i2 < S2; i2++ ) {
									for ( i1 = 0; i1 < S1; i1++ ) {
										for ( i0 = 0; i0 < S0; i0++ ) {
											// Point the sub-array views at the current element pointers and reshape the input view:
											setViewOffsets( views, iv );
											v[ 0 ] = strategy( views[ 0 ] );

											// Wrap the callback for the current set of loop indices:
											f = wrap( arrays[ 0 ].ref, views[ 0 ], ibuf, ldims, [ i9, i8, i7, i6, i5, i4, i3, i2, i1, i0 ], cdims, clbk, thisArg );

											// Perform the reduction and write the result at the current output pointer:
											ybuf[ iv[1] ] = ( hasOpts ) ? fcn( v, opts, f ) : fcn( v, f );
											incrementOffsets( iv, dv0 );
										}
										incrementOffsets( iv, dv1 );
									}
									incrementOffsets( iv, dv2 );
								}
								incrementOffsets( iv, dv3 );
							}
							incrementOffsets( iv, dv4 );
						}
						incrementOffsets( iv, dv5 );
					}
					incrementOffsets( iv, dv6 );
				}
				incrementOffsets( iv, dv7 );
			}
			incrementOffsets( iv, dv8 );
		}
		incrementOffsets( iv, dv9 );
	}
}
302+
303+
304+
// EXPORTS //
305+
306+
module.exports = unary10d;

0 commit comments

Comments
 (0)