diff options
author | Chen-Pang He <jdh8@ms63.hinet.net> | 2012-09-08 02:06:45 +0800 |
---|---|---|
committer | Chen-Pang He <jdh8@ms63.hinet.net> | 2012-09-08 02:06:45 +0800 |
commit | 1b61aadcbe0f3d8c6898d28b7605347a7643190d (patch) | |
tree | 8644a7530385714f93193c7a824e181271939b9d /blas/double.cpp | |
parent | b0b9b4d6b223cfbfee564427514cd6d693e1c503 (diff) |
Implement SDSDOT with DSDOT and avoid allocating buffers in DSDOT.
Diffstat (limited to 'blas/double.cpp')
-rw-r--r-- | blas/double.cpp | 26 |
1 files changed, 8 insertions, 18 deletions
```diff
diff --git a/blas/double.cpp b/blas/double.cpp
index 8a3b00175..8fd0709ba 100644
--- a/blas/double.cpp
+++ b/blas/double.cpp
@@ -19,25 +19,15 @@
 #include "level2_real_impl.h"
 #include "level3_impl.h"
 
-// currently used by DSDOT only
-double* cast_vector_to_double(float* x, int n, int incx)
+double BLASFUNC(dsdot)(int* n, float* x, int* incx, float* y, int* incy)
 {
-  double* ret = new double[n];
-  if(incx<0) vector(ret,n) = vector(x,n,-incx).reverse().cast<double>();
-  else vector(ret,n) = vector(x,n, incx).cast<double>();
-  return ret;
-}
-
-double BLASFUNC(dsdot)(int* n, float* px, int* incx, float* py, int* incy)
-{
-  if(*n <= 0) return 0;
-
-  double* x = cast_vector_to_double(px, *n, *incx);
-  double* y = cast_vector_to_double(py, *n, *incy);
-  double res = vector(x,*n).cwiseProduct(vector(y,*n)).sum();
+  if(*n<=0) return 0;
 
-  delete[] x;
-  delete[] y;
-  return res;
+  if(*incx==1 && *incy==1) return (vector(x,*n).cast<double>().cwiseProduct(vector(y,*n).cast<double>())).sum();
+  else if(*incx>0 && *incy>0) return (vector(x,*n,*incx).cast<double>().cwiseProduct(vector(y,*n,*incy).cast<double>())).sum();
+  else if(*incx<0 && *incy>0) return (vector(x,*n,-*incx).reverse().cast<double>().cwiseProduct(vector(y,*n,*incy).cast<double>())).sum();
+  else if(*incx>0 && *incy<0) return (vector(x,*n,*incx).cast<double>().cwiseProduct(vector(y,*n,-*incy).reverse().cast<double>())).sum();
+  else if(*incx<0 && *incy<0) return (vector(x,*n,-*incx).reverse().cast<double>().cwiseProduct(vector(y,*n,-*incy).reverse().cast<double>())).sum();
+  else return 0;
 }
 
```