//===================================================== // File : INTEL_BLAS_interface.hh // Author : L. Plagne // Copyright (C) EDF R&D, lun sep 30 14:23:29 CEST 2002 //===================================================== // // This program is free software; you can redistribute it and/or // modify it under the terms of the GNU General Public License // as published by the Free Software Foundation; either version 2 // of the License, or (at your option) any later version. // // This program is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU General Public License for more details. // You should have received a copy of the GNU General Public License // along with this program; if not, write to the Free Software // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. // #ifndef INTEL_BLAS_PRODUIT_MATRICE_VECTEUR_HH #define INTEL_BLAS_PRODUIT_MATRICE_VECTEUR_HH #include "f77_interface.hh" extern "C" { #include "mkl_cblas.h" } template class INTEL_BLAS_interface : public f77_interface_base { public : typedef typename f77_interface_base::gene_matrix gene_matrix; typedef typename f77_interface_base::gene_vector gene_vector; static inline std::string name( void ) { return "INTEL_BLAS"; } static inline void matrix_vector_product(gene_matrix & A, gene_vector & B, gene_vector & X, int N) { cblas_dgemv(CblasColMajor,CblasNoTrans,N,N,1.0,A,N,B,1,0.0,X,1); } static inline void matrix_matrix_product(gene_matrix & A, gene_matrix & B, gene_matrix & X, int N) { cblas_dgemm(CblasColMajor,CblasNoTrans,CblasNoTrans,N,N,N,1.0,A,N,B,N,0.0,X,N); } static inline void ata_product(gene_matrix & A, gene_matrix & X, int N) { cblas_dgemm(CblasColMajor,CblasTrans,CblasNoTrans,N,N,N,1.0,A,N,A,N,0.0,X,N); } static inline void aat_product(gene_matrix & A, gene_matrix & X, int N) { cblas_dgemm(CblasColMajor,CblasNoTrans,CblasTrans,N,N,N,1.0,A,N,A,N,0.0,X,N); } static inline void axpy(real coef, const gene_vector & X, gene_vector & Y, int N) { cblas_daxpy(N,coef,X,1,Y,1); } }; template<> class INTEL_BLAS_interface : public f77_interface_base { public : static inline std::string name() { return "INTEL_BLAS"; } static inline void matrix_vector_product(gene_matrix & A, gene_vector & B, gene_vector & X, int N) { // cblas_sgemv(CblasNoTrans,N,N,1.0,A,N,B,1,0.0,X,1); cblas_sgemv(CblasColMajor,CblasNoTrans,N,N,1.0,A,N,B,1,0.0,X,1); } static inline void matrix_matrix_product(gene_matrix & A, gene_matrix & B, gene_matrix & X, int N) { cblas_sgemm(CblasColMajor,CblasNoTrans,CblasNoTrans,N,N,N,1.0,A,N,B,N,0.0,X,N); } static inline void ata_product(gene_matrix & A, gene_matrix & X, int N) { cblas_sgemm(CblasColMajor,CblasTrans,CblasNoTrans,N,N,N,1.0,A,N,A,N,0.0,X,N); } static inline void aat_product(gene_matrix & A, gene_matrix & X, int N) { cblas_sgemm(CblasColMajor,CblasNoTrans,CblasTrans,N,N,N,1.0,A,N,A,N,0.0,X,N); } static inline void axpy(float coef, const gene_vector & X, gene_vector & Y, int N) { cblas_saxpy(N,coef,X,1,Y,1); } }; #endif