Press n or j to go to the next uncovered block, b, p or k for the previous block.
| 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 | 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 3x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 52x 4x 4x 48x 48x 48x 48x 48x 48x 48x 48x 48x 52x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 24x 48x 48x 48x 48x 48x 48x 48x 52x 142x 142x 142x 142x 142x 10x 142x 132x 132x 132x 132x 396x 396x 396x 396x 396x 396x 132x 142x 142x 142x 48x 52x 3x 3x 3x 3x 3x | /**
* @license Apache-2.0
*
* Copyright (c) 2026 The Stdlib Authors.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
'use strict';
// MODULES //
var isRowMajor = require( '@stdlib/ndarray/base/assert/is-row-major' );
var realf = require( '@stdlib/complex/float32/real' );
var imagf = require( '@stdlib/complex/float32/imag' );
var f32 = require( '@stdlib/number/float64/base/to-float32' );
var reinterpret = require( '@stdlib/strided/base/reinterpret-complex64' );
var muladd = require( '@stdlib/complex/float32/base/mul-add' ).assign;
// MAIN //
/**
* Adds the scaled outer product `α*x*y^T` to a complex single-precision matrix in place, i.e., computes `A = α*x*y^T + A` for a scalar `α`, an `M` element vector `x`, an `N` element vector `y`, and an `M` by `N` matrix `A`.
*
* ## Notes
*
* -   Elements of `y` enter the product as-is (no complex conjugation is applied).
* -   If both components of `α` are zero, `A` is returned without being modified.
* -   When the strides of `A` are classified as row-major, the innermost loop iterates over columns; otherwise, the innermost loop iterates over rows.
*
* @private
* @param {NonNegativeInteger} M - number of rows in `A` (and number of elements read from `x`)
* @param {NonNegativeInteger} N - number of columns in `A` (and number of elements read from `y`)
* @param {Complex64} alpha - scalar multiplier
* @param {Complex64Array} x - first input vector
* @param {integer} strideX - stride length for `x`
* @param {NonNegativeInteger} offsetX - index of the first element of `x`
* @param {Complex64Array} y - second input vector
* @param {integer} strideY - stride length for `y`
* @param {NonNegativeInteger} offsetY - index of the first element of `y`
* @param {Complex64Array} A - matrix to update
* @param {integer} strideA1 - stride of the first dimension of `A`
* @param {integer} strideA2 - stride of the second dimension of `A`
* @param {NonNegativeInteger} offsetA - index of the first element of `A`
* @returns {Complex64Array} `A`
*
* @example
* var Complex64Array = require( '@stdlib/array/complex64' );
* var Complex64 = require( '@stdlib/complex/float32/ctor' );
*
* var A = new Complex64Array( [ 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 5.0, 6.0, 6.0 ] );
* var x = new Complex64Array( [ 1.0, 1.0, 2.0, 2.0 ] );
* var y = new Complex64Array( [ 3.0, 3.0, 2.0, 2.0, 1.0, 1.0 ] );
* var alpha = new Complex64( 0.5, 0.5 );
*
* cgeru( 2, 3, alpha, x, 1, 0, y, 1, 0, A, 3, 1, 0 );
* // A => <Complex64Array>[ -2.0, 4.0, 0.0, 4.0, 2.0, 4.0, -2.0, 10.0, 1.0, 9.0, 4.0, 8.0 ]
*/
function cgeru( M, N, alpha, x, strideX, offsetX, y, strideY, offsetY, A, strideA1, strideA2, offsetA ) { // eslint-disable-line max-params, max-len
	var outerCount;
	var innerCount;
	var outerStep;
	var innerStep;
	var outerVec;
	var innerVec;
	var outerInc;
	var innerInc;
	var outerOff;
	var innerOff;
	var bufOuter;
	var bufInner;
	var alphaRe;
	var alphaIm;
	var scaleRe;
	var scaleIm;
	var outerRe;
	var outerIm;
	var bufA;
	var base;
	var pa;
	var po;
	var pi;
	var j;
	var i;

	// Naming convention: "inner" refers to whatever the innermost loop walks over and "outer" to whatever the outermost loop walks over. All steps, increments, and offsets are expressed in units of real-valued elements (i.e., twice their complex counterparts).

	// Split the scalar into its components and bail out when there is nothing to add:
	alphaRe = realf( alpha );
	alphaIm = imagf( alpha );
	if ( alphaRe === 0.0 && alphaIm === 0.0 ) {
		return A;
	}
	// Assign loop roles according to the memory layout of `A`...
	if ( isRowMajor( [ strideA1, strideA2 ] ) ) {
		// Row-major: columns change fastest, so `y` drives the innermost loop and `x` the outermost loop...
		innerCount = N;
		outerCount = M;
		innerStep = strideA2 * 2;
		outerStep = strideA1 * 2;

		innerVec = y;
		innerInc = strideY * 2;
		innerOff = offsetY * 2;

		outerVec = x;
		outerInc = strideX * 2;
		outerOff = offsetX * 2;
	} else {
		// Column-major: rows change fastest, so `x` drives the innermost loop and `y` the outermost loop...
		innerCount = M;
		outerCount = N;
		innerStep = strideA1 * 2;
		outerStep = strideA2 * 2;

		innerVec = x;
		innerInc = strideX * 2;
		innerOff = offsetX * 2;

		outerVec = y;
		outerInc = strideY * 2;
		outerOff = offsetY * 2;
	}
	// Obtain real-valued views in which real and imaginary components are interleaved:
	bufA = reinterpret( A, 0 );
	bufInner = reinterpret( innerVec, 0 );
	bufOuter = reinterpret( outerVec, 0 );

	po = outerOff;
	base = offsetA * 2; // index of the first element of the current outer slice of `A`
	for ( j = 0; j < outerCount; j++ ) {
		outerRe = bufOuter[ po ];
		outerIm = bufOuter[ po+1 ];

		// Only visit the slice when the outer vector element is not exactly zero...
		if ( outerRe !== 0.0 || outerIm !== 0.0 ) {
			// Pre-multiply the outer vector element by `α` using single-precision arithmetic:
			scaleRe = f32( f32( alphaRe*outerRe ) - f32( alphaIm*outerIm ) );
			scaleIm = f32( f32( alphaRe*outerIm ) + f32( alphaIm*outerRe ) );

			pi = innerOff;
			pa = base;
			for ( i = 0; i < innerCount; i++ ) {
				// Accumulate `inner*scale + A` directly into the view of `A`:
				muladd( bufInner[ pi ], bufInner[ pi+1 ], scaleRe, scaleIm, bufA[ pa ], bufA[ pa+1 ], bufA, 1, pa ); // eslint-disable-line max-len
				pi += innerInc;
				pa += innerStep;
			}
		}
		po += outerInc;
		base += outerStep;
	}
	return A;
}
// EXPORTS //
// Expose the rank 1 update routine as this module's export:
module.exports = cgeru;
|