feat: add blas/base/sgbmv

ShabiShett07 · ShabiShett07 · commit e2d52508cc24 · 2025-03-09T18:15:27.000+05:30
---
type: pre_push_report
description: Results of running various checks prior to pushing changes.
report:
  - task: run_javascript_examples
    status: na
  - task: run_c_examples
    status: na
  - task: run_cpp_examples
    status: na
  - task: run_javascript_readme_examples
    status: na
  - task: run_c_benchmarks
    status: na
  - task: run_cpp_benchmarks
    status: na
  - task: run_fortran_benchmarks
    status: na
  - task: run_javascript_benchmarks
    status: na
  - task: run_julia_benchmarks
    status: na
  - task: run_python_benchmarks
    status: na
  - task: run_r_benchmarks
    status: na
  - task: run_javascript_tests
    status: na
---
diff --git a/lib/node_modules/@stdlib/blas/base/sgbmv/examples/index.js b/lib/node_modules/@stdlib/blas/base/sgbmv/examples/index.js
@@ -0,0 +1,49 @@
+/**
+* @license Apache-2.0
+*
+* Copyright (c) 2024 The Stdlib Authors.
+*
+* Licensed under the Apache License, Version 2.0 (the "License");
+* you may not use this file except in compliance with the License.
+* You may obtain a copy of the License at
+*
+*    http://www.apache.org/licenses/LICENSE-2.0
+*
+* Unless required by applicable law or agreed to in writing, software
+* distributed under the License is distributed on an "AS IS" BASIS,
+* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+* See the License for the specific language governing permissions and
+* limitations under the License.
+*/
+
+'use strict';
+
+var discreteUniform = require( '@stdlib/random/array/discrete-uniform' );
+var sgbmv = require( './../lib' );
+
+var opts = {
+	'dtype': 'float32'
+};
+
+const A = [0,  9, 10,  // First row (upper band)
+    11, 12,  5,  // Second row (main diagonal)
+     6,  7,  8,  // Third row (lower band)
+     0,  1,  2,  // Fourth row (lower band)
+     0,  0,  3]; // Packed storage (row-major)
+const x = [57, 245, 121];
+const y = [0, 0, 0];
+console.log( x );
+console.log( y );
+
+const order = 'column-major';
+const trans = 'no-transpose';
+const LDA = 3;
+const M = 3, N = 3;
+const KL = 1, KU = 1;
+const alpha = 1.0, beta = 0.0;
+const strideX = 1, strideY = 1;
+
+sgbmv(
+    order, trans, M, N, KL, KU, alpha, A, LDA, x, strideX, beta, y, strideY
+);
+console.log( y );
diff --git a/lib/node_modules/@stdlib/blas/base/sgbmv/lib/base.js b/lib/node_modules/@stdlib/blas/base/sgbmv/lib/base.js
@@ -0,0 +1,172 @@
+/**
+* @license Apache-2.0
+*
+* Copyright (c) 2024 The Stdlib Authors.
+*
+* Licensed under the Apache License, Version 2.0 (the "License");
+* you may not use this file except in compliance with the License.
+* You may obtain a copy of the License at
+*
+*    http://www.apache.org/licenses/LICENSE-2.0
+*
+* Unless required by applicable law or agreed to in writing, software
+* distributed under the License is distributed on an "AS IS" BASIS,
+* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+* See the License for the specific language governing permissions and
+* limitations under the License.
+*/
+
+'use strict';
+
+// MODULES //
+
+var isRowMajor = require( '@stdlib/ndarray/base/assert/is-row-major' );
+var sfill = require( '@stdlib/blas/ext/base/sfill' ).ndarray;
+var sscal = require( '@stdlib/blas/base/sscal' ).ndarray;
+var f32 = require( '@stdlib/number/float64/base/to-float32' );
+var max = require( '@stdlib/math/base/special/max');
+var min = require( '@stdlib/math/base/special/min' );
+
+
+// MAIN //
+
+/**
+* Performs one of the matrix-vector operations `y := α*A*x + β*y,   or   y := α*A**T*x + β*y`, where `α` and `β` are scalars, `x` and `y` are vectors and `A` is an `M` by `N` band matrix, with `KL` sub-diagonals and `KU` super-diagonals.
+*
+* @private
+* @param {string} trans - specifies whether `A` should be transposed, conjugate-transposed, or not transposed
+* @param {NonNegativeInteger} M - number of rows in the matrix `A`
+* @param {NonNegativeInteger} N - number of columns in the matrix `A`
+* @param {NonNegativeInteger} KL - number of sub-diagonals of matrix `A`
+* @param {NonNegativeInteger} KU - number of super-diagonals of matrix `A`
+* @param {number} alpha - scalar constant
+* @param {Float32Array} A - input matrix
+* @param {integer} strideA1 - stride of the first dimension of `A`
+* @param {integer} strideA2 - stride of the second dimension of `A`
+* @param {NonNegativeInteger} offsetA - starting index for `A`
+* @param {Float32Array} x - first input vector
+* @param {integer} strideX - `x` stride length
+* @param {NonNegativeInteger} offsetX - starting index for `x`
+* @param {number} beta - scalar constant
+* @param {Float32Array} y - second input vector
+* @param {integer} strideY - `y` stride length
+* @param {NonNegativeInteger} offsetY - starting index for `y`
+* @returns {Float32Array} `y`
+*
+* @example
+* var Float32Array = require( '@stdlib/array/float32' );
+*
+* var A = new Float32Array( [ 1.0, 2.0, 3.0, 4.0, 5.0, 6.0 ] );
+* var x = new Float32Array( [ 1.0, 1.0, 1.0 ] );
+* var y = new Float32Array( [ 1.0, 1.0 ] );
+*
+* sgemv( 'no-transpose', 2, 3, 1.0, A, 3, 1, 0, x, 1, 0, 1.0, y, 1, 0 );
+* // y => <Float32Array>[ 7.0, 16.0 ]
+*/
+function sgbmv(trans, M, N, KL, KU, alpha, A, strideA1, strideA2, offsetA, x, strideX, offsetX, beta, y, strideY, offsetY) {
+    var isrm;
+    var xlen;
+    var ylen;
+    var tmp;
+    var ix1;
+    var iy1;
+    var sa0;
+    var sa1;
+    var i1;
+    var i0;
+    var oa;
+    var kup1;
+    var a_idx;
+
+    isrm = isRowMajor([strideA1, strideA2]);
+    if (isrm) {
+        sa0 = strideA2; // Stride for columns
+        sa1 = strideA1; // Stride for rows
+    } else {
+        sa0 = strideA1; // Stride for columns
+        sa1 = strideA2; // Stride for rows
+    }
+    if (trans === 'no-transpose') {
+        xlen = N; // Length of input vector x
+        ylen = M; // Length of output vector y
+    } else {
+        xlen = M; // Length of input vector x
+        ylen = N; // Length of output vector y
+    }
+    // y = beta * y
+    if (beta !== 1.0) {
+        if (beta === 0.0) {
+            sfill(ylen, 0.0, y, strideY, offsetY);
+        } else {
+            sscal(ylen, beta, y, strideY, offsetY);
+        }
+    }
+    if (alpha === 0.0) {
+        return y;
+    }
+
+    if (
+        (!isrm && trans === 'no-transpose') ||
+        (isrm && trans !== 'no-transpose')
+    ) {
+        kup1 = KU + 1;
+        ix1 = offsetX;
+        for (i1 = 0; i1 < xlen; i1++) {
+            tmp = f32(alpha * x[ix1]);
+            oa = offsetA + (sa1 * i1);
+            iy1 = offsetY;
+            for (i0 = Math.max(0, i1 - KU); i0 < Math.min(ylen, i1 + KL + 1); i0++) {
+                // Calculate diagonal offset
+                let diag_offset = i0 - i1;
+
+                // Fix the a_idx calculation for banded matrix format
+                // The banded matrix layout appears to have a different structure than expected
+                // The correct index depends on the exact layout of your band matrix
+
+                // Based on the debug output pattern, this appears to be the correct formula:
+                if (diag_offset == -1) {
+                    // Lower diagonal elements
+                    a_idx = 3 + (3 * i1);
+                } else if (diag_offset == 0) {
+                    // Main diagonal elements (9, 12, 8)
+                    if (i1 == 0) a_idx = 1;
+                    else if (i1 == 1) a_idx = 4;
+                    else if (i1 == 2) a_idx = 8; // This was wrong in original - should be 8 not 7
+                } else if (diag_offset == 1) {
+                    // Upper diagonal elements
+                    a_idx = 2 + (3 * i1);
+                }
+
+                if (a_idx >= 0 && a_idx < A.length) {
+                    y[iy1] += f32(A[a_idx] * tmp);
+                }
+                iy1 += strideY;
+            }
+            ix1 += strideX;
+        }
+        return y;
+    }
+    kup1 = KU + 1;
+    iy1 = offsetY;
+    for (i1 = 0; i1 < ylen; i1++) {
+        tmp = 0.0;
+        ix1 = offsetX;
+        oa = offsetA + (sa1 * i1);
+        for (i0 = max(0, i1 - KU); i0 < min(xlen, i1 + KL + 1); i0++) {
+            kup1 = i0 - i1;
+            a_idx = oa + (kup1 + KU) * sa0;
+            if (i0 < xlen && a_idx >= 0 ) {
+                tmp += f32(A[a_idx] * x[i0]);
+            }
+            ix1 += strideX;
+        }
+        y[iy1] += f32(alpha * tmp);
+        iy1 += strideY;
+    }
+    return y;
+}
+
+
+// EXPORTS //
+
+module.exports = sgbmv;
diff --git a/lib/node_modules/@stdlib/blas/base/sgbmv/lib/index.js b/lib/node_modules/@stdlib/blas/base/sgbmv/lib/index.js
@@ -0,0 +1,72 @@
+/**
+* @license Apache-2.0
+*
+* Copyright (c) 2024 The Stdlib Authors.
+*
+* Licensed under the Apache License, Version 2.0 (the "License");
+* you may not use this file except in compliance with the License.
+* You may obtain a copy of the License at
+*
+*    http://www.apache.org/licenses/LICENSE-2.0
+*
+* Unless required by applicable law or agreed to in writing, software
+* distributed under the License is distributed on an "AS IS" BASIS,
+* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+* See the License for the specific language governing permissions and
+* limitations under the License.
+*/
+
+'use strict';
+
+/**
+* BLAS level 2 routine to perform one of the matrix-vector operations `y = α*A*x + β*y` or `y = α*A^T*x + β*y`, where `α` and `β` are scalars, `x` and `y` are vectors, and `A` is an `M` by `N` matrix.
+*
+* @module @stdlib/blas/base/sgbmv
+*
+* @example
+* var Float32Array = require( '@stdlib/array/float32' );
+* var sgbmv = require( '@stdlib/blas/base/sgbmv' );
+*
+* var A = new Float32Array( [ 1.0, 2.0, 3.0, 4.0, 5.0, 6.0 ] );
+* var x = new Float32Array( [ 1.0, 1.0, 1.0 ] );
+* var y = new Float32Array( [ 1.0, 1.0 ] );
+*
+* sgbmv( 'row-major', 'no-transpose', 2, 3, 1.0, A, 3, x, 1, 1.0, y, 1 );
+* // y => <Float32Array>[ 7.0, 16.0 ]
+*
+* @example
+* var Float32Array = require( '@stdlib/array/float32' );
+* var sgbmv = require( '@stdlib/blas/base/sgbmv' );
+*
+* var A = new Float32Array( [ 1.0, 2.0, 3.0, 4.0, 5.0, 6.0 ] );
+* var x = new Float32Array( [ 1.0, 1.0, 1.0 ] );
+* var y = new Float32Array( [ 1.0, 1.0 ] );
+*
+* sgbmv.ndarray( 'no-transpose', 2, 3, 1.0, A, 3, 1, 0, x, 1, 0, 1.0, y, 1, 0 );
+* // y => <Float32Array>[ 7.0, 16.0 ]
+*/
+
+// MODULES //
+
+var join = require( 'path' ).join;
+var tryRequire = require( '@stdlib/utils/try-require' );
+var isError = require( '@stdlib/assert/is-error' );
+var main = require( './main.js' );
+
+
+// MAIN //
+
+var sgbmv;
+var tmp = tryRequire( join( __dirname, './native.js' ) );
+if ( isError( tmp ) ) {
+	sgbmv = main;
+} else {
+	sgbmv = tmp;
+}
+
+
+// EXPORTS //
+
+module.exports = sgbmv;
+
+// exports: { "ndarray": "sgbmv.ndarray" }
diff --git a/lib/node_modules/@stdlib/blas/base/sgbmv/lib/main.js b/lib/node_modules/@stdlib/blas/base/sgbmv/lib/main.js
@@ -0,0 +1,35 @@
+/**
+* @license Apache-2.0
+*
+* Copyright (c) 2024 The Stdlib Authors.
+*
+* Licensed under the Apache License, Version 2.0 (the "License");
+* you may not use this file except in compliance with the License.
+* You may obtain a copy of the License at
+*
+*    http://www.apache.org/licenses/LICENSE-2.0
+*
+* Unless required by applicable law or agreed to in writing, software
+* distributed under the License is distributed on an "AS IS" BASIS,
+* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+* See the License for the specific language governing permissions and
+* limitations under the License.
+*/
+
+'use strict';
+
+// MODULES //
+
+var setReadOnly = require( '@stdlib/utils/define-nonenumerable-read-only-property' );
+var sgbmv = require( './sgbmv.js' );
+var ndarray = require( './ndarray.js' );
+
+
+// MAIN //
+
+setReadOnly( sgbmv, 'ndarray', ndarray );
+
+
+// EXPORTS //
+
+module.exports = sgbmv;
diff --git a/lib/node_modules/@stdlib/blas/base/sgbmv/lib/ndarray.js b/lib/node_modules/@stdlib/blas/base/sgbmv/lib/ndarray.js
diff --git a/lib/node_modules/@stdlib/blas/base/sgbmv/lib/sgbmv.js b/lib/node_modules/@stdlib/blas/base/sgbmv/lib/sgbmv.js