[2154] | 1 | /*************************************************************************
|
---|
| 2 | Copyright (c) 2005-2007, Sergey Bochkanov (ALGLIB project).
|
---|
| 3 |
|
---|
[2430] | 4 | >>> SOURCE LICENSE >>>
|
---|
| 5 | This program is free software; you can redistribute it and/or modify
|
---|
| 6 | it under the terms of the GNU General Public License as published by
|
---|
| 7 | the Free Software Foundation (www.fsf.org); either version 2 of the
|
---|
| 8 | License, or (at your option) any later version.
|
---|
[2154] | 9 |
|
---|
[2430] | 10 | This program is distributed in the hope that it will be useful,
|
---|
| 11 | but WITHOUT ANY WARRANTY; without even the implied warranty of
|
---|
| 12 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
---|
| 13 | GNU General Public License for more details.
|
---|
[2154] | 14 |
|
---|
[2430] | 15 | A copy of the GNU General Public License is available at
|
---|
| 16 | http://www.fsf.org/licensing/licenses
|
---|
[2154] | 17 |
|
---|
[2430] | 18 | >>> END OF LICENSE >>>
|
---|
[2154] | 19 | *************************************************************************/
|
---|
| 20 |
|
---|
| 21 | using System;
|
---|
| 22 |
|
---|
[2430] | 23 | namespace alglib
|
---|
[2154] | 24 | {
|
---|
[2430] | 25 | public class blas
|
---|
[2154] | 26 | {
|
---|
//
// Returns the Euclidean (2-) norm of the elements x[i1..i2].
//
// The sum is kept in scaled form: "scale" holds the largest magnitude seen
// so far and "sumsq" holds the sum of squares of the processed entries
// divided by scale^2, so the answer is scale*sqrt(sumsq).
// NOTE(review): presumably done this way to avoid overflow/underflow when
// squaring very large or very small entries - confirm.
//
// An empty range (i2 less than i1) yields 0; a single element yields its
// absolute value. Entries equal to zero are skipped.
//
public static double vectornorm2(ref double[] x,
    int i1,
    int i2)
{
    int count = i2 - i1 + 1;
    if (count < 1)
    {
        return 0;
    }
    if (count == 1)
    {
        return Math.Abs(x[i1]);
    }

    double scale = 0;
    double sumsq = 1;
    for (int pos = i1; pos <= i2; pos++)
    {
        if ((double)(x[pos]) == (double)(0))
        {
            // Zero entries contribute nothing (and would divide by zero below).
            continue;
        }

        double magnitude = Math.Abs(x[pos]);
        if ((double)(scale) < (double)(magnitude))
        {
            // New largest magnitude: rescale the accumulated sum to it.
            sumsq = 1 + sumsq * AP.Math.Sqr(scale / magnitude);
            scale = magnitude;
        }
        else
        {
            sumsq = sumsq + AP.Math.Sqr(magnitude / scale);
        }
    }
    return scale * Math.Sqrt(sumsq);
}
| 70 |
|
---|
| 71 |
|
---|
//
// Returns the index, within [i1..i2], of the element of x with the largest
// absolute value. On ties the smallest index wins (the comparison is strict).
//
// x[i1] is always read, so i1 must be a valid index even when i2 is less
// than i1; in that case i1 is returned.
//
public static int vectoridxabsmax(ref double[] x,
    int i1,
    int i2)
{
    int result = i1;

    // Running maximum of |x[.]|; cached so it is not recomputed per iteration.
    double best = Math.Abs(x[result]);

    for (int i = i1 + 1; i <= i2; i++)
    {
        double candidate = Math.Abs(x[i]);
        if ((double)(candidate) > (double)(best))
        {
            result = i;
            best = candidate;
        }
    }
    return result;
}
| 91 |
|
---|
| 92 |
|
---|
//
// Returns the row index, within [i1..i2], of the entry of column j of x
// with the largest absolute value. On ties the smallest row index wins
// (the comparison is strict).
//
// x[i1,j] is always read, so (i1,j) must be a valid position even when i2
// is less than i1; in that case i1 is returned.
//
public static int columnidxabsmax(ref double[,] x,
    int i1,
    int i2,
    int j)
{
    int result = i1;

    // Running maximum of |x[.,j]|; cached so it is not recomputed per iteration.
    double best = Math.Abs(x[result, j]);

    for (int i = i1 + 1; i <= i2; i++)
    {
        double candidate = Math.Abs(x[i, j]);
        if ((double)(candidate) > (double)(best))
        {
            result = i;
            best = candidate;
        }
    }
    return result;
}
| 113 |
|
---|
| 114 |
|
---|
//
// Returns the column index, within [j1..j2], of the entry of row i of x
// with the largest absolute value. On ties the smallest column index wins
// (the comparison is strict).
//
// x[i,j1] is always read, so (i,j1) must be a valid position even when j2
// is less than j1; in that case j1 is returned.
//
public static int rowidxabsmax(ref double[,] x,
    int j1,
    int j2,
    int i)
{
    int result = j1;

    // Running maximum of |x[i,.]|; cached so it is not recomputed per iteration.
    double best = Math.Abs(x[i, result]);

    for (int j = j1 + 1; j <= j2; j++)
    {
        double candidate = Math.Abs(x[i, j]);
        if ((double)(candidate) > (double)(best))
        {
            result = j;
            best = candidate;
        }
    }
    return result;
}
| 135 |
|
---|
| 136 |
|
---|
//
// Returns the largest column sum of absolute values over the sub-matrix
// a[i1..i2, j1..j2], where in each row only the entries from one position
// left of the diagonal onwards are included (the upper Hessenberg part).
//
// work[j1..j2] is overwritten with the per-column sums.
// A debug assertion checks that the sub-matrix is square.
//
public static double upperhessenberg1norm(ref double[,] a,
    int i1,
    int i2,
    int j1,
    int j2,
    ref double[] work)
{
    System.Diagnostics.Debug.Assert(i2-i1==j2-j1, "UpperHessenberg1Norm: I2-I1<>J2-J1!");

    int col;
    for (col = j1; col <= j2; col++)
    {
        work[col] = 0;
    }

    for (int row = i1; row <= i2; row++)
    {
        // First included column of this row: the sub-diagonal, clamped to j1.
        int firstCol = Math.Max(j1, j1 + row - i1 - 1);
        for (col = firstCol; col <= j2; col++)
        {
            work[col] += Math.Abs(a[row, col]);
        }
    }

    double largest = 0;
    for (col = j1; col <= j2; col++)
    {
        largest = Math.Max(largest, work[col]);
    }
    return largest;
}
| 167 |
|
---|
| 168 |
|
---|
//
// Copies the sub-matrix a[is1..is2, js1..js2] into b[id1..id2, jd1..jd2].
//
// Does nothing when the source range is empty. Debug assertions check that
// source and destination ranges have the same extents; the inner loop is
// driven by the destination column range jd1..jd2.
//
public static void copymatrix(ref double[,] a,
    int is1,
    int is2,
    int js1,
    int js2,
    ref double[,] b,
    int id1,
    int id2,
    int jd1,
    int jd2)
{
    if (is1 > is2 || js1 > js2)
    {
        return;
    }
    System.Diagnostics.Debug.Assert(is2-is1==id2-id1, "CopyMatrix: different sizes!");
    System.Diagnostics.Debug.Assert(js2-js1==jd2-jd1, "CopyMatrix: different sizes!");

    // Offset that maps a destination column to its source column.
    int colShift = js1 - jd1;
    for (int srcRow = is1; srcRow <= is2; srcRow++)
    {
        int dstRow = srcRow - is1 + id1;
        for (int dstCol = jd1; dstCol <= jd2; dstCol++)
        {
            b[dstRow, dstCol] = a[srcRow, dstCol + colShift];
        }
    }
}
| 201 |
|
---|
| 202 |
|
---|
//
// Transposes the sub-matrix a[i1..i2, j1..j2] in place.
//
// For every diagonal position the part of the column below it and the part
// of the row to its right are exchanged, using work as temporary storage.
// work is written starting at index 1 (index 0 is not touched); at most
// i2-i1 elements are used.
//
// Does nothing when the range is empty. A debug assertion checks that the
// sub-matrix is square.
//
public static void inplacetranspose(ref double[,] a,
    int i1,
    int i2,
    int j1,
    int j2,
    ref double[] work)
{
    if (i1 > i2 || j1 > j2)
    {
        return;
    }
    System.Diagnostics.Debug.Assert(i1-i2==j1-j2, "InplaceTranspose error: incorrect array size!");

    for (int row = i1; row <= i2 - 1; row++)
    {
        int diagCol = j1 + row - i1;        // column of the diagonal entry in this row
        int belowRow = row + 1;             // first row under the diagonal
        int rightCol = j1 + belowRow - i1;  // first column right of the diagonal
        int tail = i2 - row;                // number of entries under the diagonal

        // Save the column segment below the diagonal.
        for (int k = 1; k <= tail; k++)
        {
            work[k] = a[k + (belowRow - 1), diagCol];
        }

        // Row segment right of the diagonal goes into the column.
        for (int r = belowRow; r <= i2; r++)
        {
            a[r, diagCol] = a[row, r + (rightCol - belowRow)];
        }

        // Saved column segment goes into the row.
        for (int c = rightCol; c <= j2; c++)
        {
            a[row, c] = work[c + (1 - rightCol)];
        }
    }
}
[2430] | 246 |
|
---|
| 247 |
|
---|
//
// Writes the transpose of a[is1..is2, js1..js2] into b[id1..id2, jd1..jd2]:
// each source row becomes a destination column.
//
// Does nothing when the source range is empty. Debug assertions check that
// the source row count matches the destination column count and vice
// versa; the inner loop is driven by the destination row range id1..id2.
//
public static void copyandtranspose(ref double[,] a,
    int is1,
    int is2,
    int js1,
    int js2,
    ref double[,] b,
    int id1,
    int id2,
    int jd1,
    int jd2)
{
    if (is1 > is2 || js1 > js2)
    {
        return;
    }
    System.Diagnostics.Debug.Assert(is2-is1==jd2-jd1, "CopyAndTranspose: different sizes!");
    System.Diagnostics.Debug.Assert(js2-js1==id2-id1, "CopyAndTranspose: different sizes!");

    // Offset that maps a destination row to its source column.
    int shift = js1 - id1;
    for (int srcRow = is1; srcRow <= is2; srcRow++)
    {
        int dstCol = srcRow - is1 + jd1;
        for (int dstRow = id1; dstRow <= id2; dstRow++)
        {
            b[dstRow, dstCol] = a[srcRow, dstRow + shift];
        }
    }
}
| 280 |
|
---|
| 281 |
|
---|
//
// Computes y := alpha*op(A)*x + beta*y, where A is a[i1..i2, j1..j2],
// op(A) is A when trans is false and A' (transpose) when trans is true,
// x is x[ix1..ix2] and y is y[iy1..iy2].
//
// Does nothing when the matrix range is empty. When beta is exactly zero
// y is overwritten with zeros rather than multiplied, so its previous
// contents do not matter. Debug assertions check that the vector lengths
// match the matrix extents.
//
public static void matrixvectormultiply(ref double[,] a,
    int i1,
    int i2,
    int j1,
    int j2,
    bool trans,
    ref double[] x,
    int ix1,
    int ix2,
    double alpha,
    ref double[] y,
    int iy1,
    int iy2,
    double beta)
{
    if (i1 > i2 || j1 > j2)
    {
        return;
    }

    if (trans)
    {
        System.Diagnostics.Debug.Assert(i2-i1==ix2-ix1, "MatrixVectorMultiply: A and X dont match!");
        System.Diagnostics.Debug.Assert(j2-j1==iy2-iy1, "MatrixVectorMultiply: A and Y dont match!");
    }
    else
    {
        System.Diagnostics.Debug.Assert(j2-j1==ix2-ix1, "MatrixVectorMultiply: A and X dont match!");
        System.Diagnostics.Debug.Assert(i2-i1==iy2-iy1, "MatrixVectorMultiply: A and Y dont match!");
    }

    //
    // beta*y
    //
    bool clearY = (double)(beta) == (double)(0);
    for (int k = iy1; k <= iy2; k++)
    {
        if (clearY)
        {
            y[k] = 0;
        }
        else
        {
            y[k] = beta * y[k];
        }
    }

    if (trans)
    {
        //
        // alpha*A'*x: every row of A, weighted by its x entry, is added to y
        //
        int shift = j1 - iy1;
        for (int row = i1; row <= i2; row++)
        {
            double weight = alpha * x[ix1 + row - i1];
            for (int k = iy1; k <= iy2; k++)
            {
                y[k] = y[k] + weight * a[row, k + shift];
            }
        }
    }
    else
    {
        //
        // alpha*A*x: one dot product per row of A
        //
        int shift = ix1 - j1;
        for (int row = i1; row <= i2; row++)
        {
            double dot = 0.0;
            for (int col = j1; col <= j2; col++)
            {
                dot += a[row, col] * x[col + shift];
            }
            int target = iy1 + row - i1;
            y[target] = y[target] + alpha * dot;
        }
    }
}
| 392 |
|
---|
| 393 |
|
---|
//
// Returns sqrt(x^2 + y^2), computed as w*sqrt(1 + (z/w)^2) where w is the
// larger and z the smaller of |x| and |y|.
// NOTE(review): presumably written this way so that squaring a large
// argument does not overflow - confirm.
//
// When the smaller magnitude is exactly zero the larger one is returned
// directly (this also covers x = y = 0 without dividing by zero).
//
public static double pythag2(double x,
    double y)
{
    double magX = Math.Abs(x);
    double magY = Math.Abs(y);
    double larger = Math.Max(magX, magY);
    double smaller = Math.Min(magX, magY);

    return (double)(smaller) == (double)(0)
        ? larger
        : larger * Math.Sqrt(1 + AP.Math.Sqr(smaller / larger));
}
| 417 |
|
---|
| 418 |
|
---|
//
// Computes C := alpha*op(A)*op(B) + beta*C, where
//   A is a[ai1..ai2, aj1..aj2], op(A) = A or A' according to transa,
//   B is b[bi1..bi2, bj1..bj2], op(B) = B or B' according to transb,
//   C is c[ci1..ci2, cj1..cj2].
//
// A debug assertion checks that the inner dimensions agree. Nothing is
// done when any dimension of op(A) or op(B) is not positive. When beta is
// exactly zero C is overwritten with zeros rather than multiplied.
//
// work is scratch storage addressed from index 1. Elements 1 and
// max(all four dimensions) are written up front (the original comment
// labels this "Test WORK").
// NOTE(review): presumably so that a too-short buffer fails before C is
// modified - confirm.
// Only the A'*B' case actually uses work for intermediate values.
//
public static void matrixmatrixmultiply(ref double[,] a,
    int ai1,
    int ai2,
    int aj1,
    int aj2,
    bool transa,
    ref double[,] b,
    int bi1,
    int bi2,
    int bj1,
    int bj2,
    bool transb,
    double alpha,
    ref double[,] c,
    int ci1,
    int ci2,
    int cj1,
    int cj2,
    double beta,
    ref double[] work)
{
    //
    // Setup: dimensions of op(A) and op(B)
    //
    int aStoredRows = ai2 - ai1 + 1;
    int aStoredCols = aj2 - aj1 + 1;
    int bStoredRows = bi2 - bi1 + 1;
    int bStoredCols = bj2 - bj1 + 1;
    int arows = transa ? aStoredCols : aStoredRows;
    int acols = transa ? aStoredRows : aStoredCols;
    int brows = transb ? bStoredCols : bStoredRows;
    int bcols = transb ? bStoredRows : bStoredCols;
    System.Diagnostics.Debug.Assert(acols==brows, "MatrixMatrixMultiply: incorrect matrix sizes!");
    if (arows <= 0 || acols <= 0 || brows <= 0 || bcols <= 0)
    {
        return;
    }
    int crows = arows;

    //
    // Test WORK
    //
    int largestDim = Math.Max(Math.Max(brows, Math.Max(arows, acols)), bcols);
    work[1] = 0;
    work[largestDim] = 0;

    //
    // Prepare C
    //
    bool clearC = (double)(beta) == (double)(0);
    for (int row = ci1; row <= ci2; row++)
    {
        for (int col = cj1; col <= cj2; col++)
        {
            if (clearC)
            {
                c[row, col] = 0;
            }
            else
            {
                c[row, col] = beta * c[row, col];
            }
        }
    }

    if (!transa)
    {
        if (!transb)
        {
            //
            // A*B: each scaled entry of A adds a multiple of a row of B to a row of C
            //
            int shift = bj1 - cj1;
            for (int aRow = ai1; aRow <= ai2; aRow++)
            {
                int cRow = ci1 + aRow - ai1;
                for (int bRow = bi1; bRow <= bi2; bRow++)
                {
                    double factor = alpha * a[aRow, aj1 + bRow - bi1];
                    for (int cCol = cj1; cCol <= cj2; cCol++)
                    {
                        c[cRow, cCol] = c[cRow, cCol] + factor * b[bRow, cCol + shift];
                    }
                }
            }
        }
        else
        {
            //
            // A*B': every entry of C is a dot product of a row of A with a row of B.
            // The two variants differ only in which loop is the outer one.
            //
            int shift = bj1 - aj1;
            if (arows * acols < brows * bcols)
            {
                for (int bRow = bi1; bRow <= bi2; bRow++)
                {
                    for (int aRow = ai1; aRow <= ai2; aRow++)
                    {
                        double dot = 0.0;
                        for (int aCol = aj1; aCol <= aj2; aCol++)
                        {
                            dot += a[aRow, aCol] * b[bRow, aCol + shift];
                        }
                        int cRow = ci1 + aRow - ai1;
                        int cCol = cj1 + bRow - bi1;
                        c[cRow, cCol] = c[cRow, cCol] + alpha * dot;
                    }
                }
            }
            else
            {
                for (int aRow = ai1; aRow <= ai2; aRow++)
                {
                    for (int bRow = bi1; bRow <= bi2; bRow++)
                    {
                        double dot = 0.0;
                        for (int aCol = aj1; aCol <= aj2; aCol++)
                        {
                            dot += a[aRow, aCol] * b[bRow, aCol + shift];
                        }
                        int cRow = ci1 + aRow - ai1;
                        int cCol = cj1 + bRow - bi1;
                        c[cRow, cCol] = c[cRow, cCol] + alpha * dot;
                    }
                }
            }
        }
        return;
    }

    if (!transb)
    {
        //
        // A'*B: columns of A play the role of rows of op(A)
        //
        int shift = bj1 - cj1;
        for (int aCol = aj1; aCol <= aj2; aCol++)
        {
            int cRow = ci1 + aCol - aj1;
            for (int bRow = bi1; bRow <= bi2; bRow++)
            {
                double factor = alpha * a[ai1 + bRow - bi1, aCol];
                for (int cCol = cj1; cCol <= cj2; cCol++)
                {
                    c[cRow, cCol] = c[cRow, cCol] + factor * b[bRow, cCol + shift];
                }
            }
        }
        return;
    }

    //
    // A'*B'
    //
    if (arows * acols < brows * bcols)
    {
        // Build one column of the product in work[1..crows], then add it to C.
        for (int bRow = bi1; bRow <= bi2; bRow++)
        {
            for (int k = 1; k <= crows; k++)
            {
                work[k] = 0.0;
            }

            int cCol = cj1 + bRow - bi1;
            for (int aRow = ai1; aRow <= ai2; aRow++)
            {
                double factor = alpha * b[bRow, bj1 + aRow - ai1];
                for (int k = 1; k <= crows; k++)
                {
                    work[k] = work[k] + factor * a[aRow, k + (aj1 - 1)];
                }
            }

            for (int cRow = ci1; cRow <= ci2; cRow++)
            {
                c[cRow, cCol] = c[cRow, cCol] + work[cRow + (1 - ci1)];
            }
        }
    }
    else
    {
        // Copy one column of A into work[1..len], then dot it with every row of B.
        int len = ai2 - ai1 + 1;
        for (int aCol = aj1; aCol <= aj2; aCol++)
        {
            for (int k = 1; k <= len; k++)
            {
                work[k] = a[k + (ai1 - 1), aCol];
            }

            int cRow = ci1 + aCol - aj1;
            for (int bRow = bi1; bRow <= bi2; bRow++)
            {
                double dot = 0.0;
                for (int k = 1; k <= len; k++)
                {
                    dot += work[k] * b[bRow, k + (bj1 - 1)];
                }
                int cCol = cj1 + bRow - bi1;
                c[cRow, cCol] = c[cRow, cCol] + alpha * dot;
            }
        }
    }
}
| 659 | }
|
---|
| 660 | }
|
---|