time-to-botec

Benchmark sampling in different programming languages
Log | Files | Refs | README

scusumkbn2.js (2963B)


      1 /**
      2 * @license Apache-2.0
      3 *
      4 * Copyright (c) 2020 The Stdlib Authors.
      5 *
      6 * Licensed under the Apache License, Version 2.0 (the "License");
      7 * you may not use this file except in compliance with the License.
      8 * You may obtain a copy of the License at
      9 *
     10 *    http://www.apache.org/licenses/LICENSE-2.0
     11 *
     12 * Unless required by applicable law or agreed to in writing, software
     13 * distributed under the License is distributed on an "AS IS" BASIS,
     14 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
     15 * See the License for the specific language governing permissions and
     16 * limitations under the License.
     17 */
     18 
     19 'use strict';
     20 
     21 // MODULES //
     22 
     23 var float64ToFloat32 = require( '@stdlib/number/float64/base/to-float32' );
     24 var abs = require( '@stdlib/math/base/special/abs' );
     25 
     26 
     27 // MAIN //
     28 
     29 /**
     30 * Computes the cumulative sum of single-precision floating-point strided array elements using a second-order iterative Kahan–Babuška algorithm.
     31 *
     32 * ## Method
     33 *
     34 * -   This implementation uses a second-order iterative Kahan–Babuška algorithm, as described by Klein (2005).
     35 *
     36 * ## References
     37 *
     38 * -   Klein, Andreas. 2005. "A Generalized Kahan-Babuška-Summation-Algorithm." _Computing_ 76 (3): 279–93. doi:[10.1007/s00607-005-0139-x](https://doi.org/10.1007/s00607-005-0139-x).
     39 *
     40 * @param {PositiveInteger} N - number of indexed elements
     41 * @param {number} sum - initial sum
     42 * @param {Float32Array} x - input array
     43 * @param {integer} strideX - `x` stride length
     44 * @param {Float32Array} y - output array
     45 * @param {integer} strideY - `y` stride length
     46 * @returns {Float32Array} output array
     47 *
     48 * @example
     49 * var Float32Array = require( '@stdlib/array/float32' );
     50 *
     51 * var x = new Float32Array( [ 1.0, -2.0, 2.0 ] );
     52 * var y = new Float32Array( x.length );
     53 * var N = x.length;
     54 *
     55 * var v = scusumkbn2( N, 0.0, x, 1, y, 1 );
     56 * // returns <Float32Array>[ 1.0, -1.0, 1.0 ]
     57 */
     58 function scusumkbn2( N, sum, x, strideX, y, strideY ) {
     59 	var ccs;
     60 	var ix;
     61 	var iy;
     62 	var cs;
     63 	var cc;
     64 	var v;
     65 	var t;
     66 	var c;
     67 	var i;
     68 
     69 	if ( N <= 0 ) {
     70 		return y;
     71 	}
     72 	if ( strideX < 0 ) {
     73 		ix = (1-N) * strideX;
     74 	} else {
     75 		ix = 0;
     76 	}
     77 	if ( strideY < 0 ) {
     78 		iy = (1-N) * strideY;
     79 	} else {
     80 		iy = 0;
     81 	}
     82 	ccs = 0.0; // second order correction term for lost low order bits
     83 	cs = 0.0; // first order correction term for lost low order bits
     84 	for ( i = 0; i < N; i++ ) {
     85 		v = x[ ix ];
     86 		t = float64ToFloat32( sum+v );
     87 		if ( abs( sum ) >= abs( v ) ) {
     88 			c = float64ToFloat32( float64ToFloat32( sum-t ) + v );
     89 		} else {
     90 			c = float64ToFloat32( float64ToFloat32( v-t ) + sum );
     91 		}
     92 		sum = t;
     93 		t = float64ToFloat32( cs+c );
     94 		if ( abs( cs ) >= abs( c ) ) {
     95 			cc = float64ToFloat32( float64ToFloat32( cs-t ) + c );
     96 		} else {
     97 			cc = float64ToFloat32( float64ToFloat32( c-t ) + cs );
     98 		}
     99 		cs = t;
    100 		ccs = float64ToFloat32( ccs+cc );
    101 
    102 		y[ iy ] = float64ToFloat32( sum + float64ToFloat32( cs+ccs ) );
    103 		ix += strideX;
    104 		iy += strideY;
    105 	}
    106 	return y;
    107 }
    108 
    109 
    110 // EXPORTS //
    111 
    112 module.exports = scusumkbn2;