doc/html/Teuchos__BLAS_8cpp_source.html

 // @HEADER

 // *****************************************************************************

 //                    Teuchos: Common Tools Package

 //

 // Copyright 2004 NTESS and the Teuchos contributors.

 // SPDX-License-Identifier: BSD-3-Clause

 // *****************************************************************************

 // @HEADER


 #include "Teuchos_BLAS.hpp"

 #include "Teuchos_BLAS_wrappers.hpp"


 /* For INTEL_CXML, the second argument may need to be changed to 'one'.  If so,
 the appropriate declaration of 'one' will need to be added back into the
 functions that use the macro.
 */


 // File-local value that CHAR_MACRO places after each character argument
 // when the build defines INTEL_CXML.
 namespace {
 #ifdef INTEL_CXML
   unsigned int one = 1;
 #endif
 } // namespace

 // Discard any CHAR_MACRO definition inherited from elsewhere.
 #if defined(CHAR_MACRO)
 #  undef CHAR_MACRO
 #endif

 // CHAR_MACRO(c) expands to the address of c; under INTEL_CXML the address is
 // followed by the extra argument 'one'.
 #ifndef INTEL_CXML
 #  define CHAR_MACRO(char_var) &char_var
 #else
 #  define CHAR_MACRO(char_var) &char_var, one
 #endif


 // Character codes passed to the BLAS routines.  ESideChar, ETranspChar,
 // EUploChar and EDiagChar are indexed with the matching enum arguments by
 // the wrappers in this file (e.g. ESideChar[side], ETranspChar[trans]).
 const char Teuchos::ESideChar[]   = { 'L', 'R' };
 const char Teuchos::ETranspChar[] = { 'N', 'T', 'C' };
 const char Teuchos::EUploChar[]   = { 'U', 'L' };
 const char Teuchos::EDiagChar[]   = { 'U', 'N' };
 const char Teuchos::ETypeChar[]   = { 'G', 'L', 'U', 'H', 'B', 'Q', 'Z' };

 // Tables below are currently disabled.
 //const char Teuchos::EFactChar[] = {'F', 'N' };
 //const char Teuchos::ENormChar[] = {'O', 'I' };
 //const char Teuchos::ECompQChar[] = {'N', 'I', 'V' };
 //const char Teuchos::EJobChar[] = {'E', 'V', 'B' };
 //const char Teuchos::EJobSChar[] = {'E', 'S' };
 //const char Teuchos::EJobVSChar[] = {'V', 'N' };
 //const char Teuchos::EHowmnyChar[] = {'A', 'S' };
 //const char Teuchos::ECMachChar[] = {'E', 'S', 'B', 'P', 'N', 'R', 'M', 'U', 'L', 'O' };
 //const char Teuchos::ESortChar[] = {'N', 'S'};


 namespace {

 // Strided dot product used by the BLAS<int, float> fallbacks in this file.
 //
 // Returns the sum over i in [0, n) of conjugate(x_i) * y_i, where successive
 // elements of x and y lie incx and incy entries apart.  The conjugate is
 // applied to x, which is the operand the hand-written complex DOT fallbacks
 // in this file conjugate; for a real Scalar, ST::conjugate is expected to be
 // the identity (TODO confirm against ScalarTraits), so the result is the
 // same either way.
 //
 // n    : number of element pairs; n <= 0 yields zero without touching x or y.
 // incx : stride through x; a negative value traverses x from its far end.
 // incy : stride through y; a negative value traverses y from its far end.
 template<typename Scalar>
 Scalar generic_dot(const int& n, const Scalar* x, const int& incx,
   const Scalar* y, const int& incy)
 {
   typedef Teuchos::ScalarTraits<Scalar> ST;

   Scalar dot = 0.0;
   // Nothing to add up.  Returning here also keeps the negative-stride start
   // offsets below from being computed for an empty range.
   if (n <= 0)
     return dot;

   if (incx==1 && incy==1) {
     for (int i = 0; i < n; ++i)
       dot += ST::conjugate(x[i])*y[i];
     return dot;
   }

   // Index into x and y rather than advancing the pointers, so that no pointer
   // outside either array is ever formed.  A negative stride starts at the
   // element furthest from the base pointer and walks back towards it.
   int ix = (incx < 0) ? (1 - n)*incx : 0;
   int iy = (incy < 0) ? (1 - n)*incy : 0;
   for (int i = 0; i < n; ++i, ix += incx, iy += incy)
     dot += ST::conjugate(x[ix])*y[iy];
   return dot;
 }

 } // namespace


 namespace Teuchos {


 // Windows builds only: instantiate these BLAS templates explicitly, because
 // they were otherwise not resolved when linking DLLs.
 #if defined(_MSC_VER)
 #  if defined(HAVE_TEUCHOS_COMPLEX)
      template class BLAS<long int, std::complex<float> >;
      template class BLAS<long int, std::complex<double> >;
 #  endif
      template class BLAS<long int, float>;
      template class BLAS<long int, double>;
 #endif


   // *************************** BLAS<int,float> DEFINITIONS ******************************


   // Single precision ROTG: passes the four pointers unchanged to SROTG_F77.
   void BLAS<int, float>::ROTG(float* da, float* db, float* c, float* s) const
   {
     SROTG_F77(da, db, c, s);
   }


   // Single precision ROT: forwards to SROT_F77, passing n and the strides by
   // address.
   void BLAS<int, float>::ROT(const int& n, float* dx, const int& incx, float* dy, const int& incy, float* c, float* s) const
   {
     SROT_F77(&n, dx, &incx, dy, &incy, c, s);
   }


   // Single precision ASUM: sum of the magnitudes of n entries of x, taken
   // every incx elements.
   //
   // Uses cblas_sasum or SASUM_F77 when the build configuration provides them;
   // otherwise a local loop computes the sum.  The local loop returns zero
   // when n <= 0 or incx <= 0.
   float BLAS<int, float>::ASUM(const int& n, const float* x, const int& incx) const
   {
 #if defined(HAVE_TEUCHOS_BLASFLOAT_APPLE_VECLIB_BUGFIX)
     return cblas_sasum(n, x, incx);
 #elif defined(HAVE_TEUCHOS_BLASFLOAT)
     float tmp = SASUM_F77(&n, x, &incx);
     return tmp;
 #else
     typedef ScalarTraits<float> ST;
     float sum = 0.0;
     // A zero stride would add x[0] n times and a negative stride would read
     // in front of x.  Return zero instead, which is what the hand-written
     // NRM2 and complex ASUM fallbacks in this file do for such strides.
     if (n <= 0 || incx <= 0)
       return sum;
     if (incx == 1) {
       for (int i = 0; i < n; ++i)
         sum += ST::magnitude(x[i]);
     }
     else {
       // Index rather than advance x so no pointer past the data is formed.
       for (int i = 0, ix = 0; i < n; ++i, ix += incx)
         sum += ST::magnitude(x[ix]);
     }
     return sum;
 #endif
   }


   // Single precision AXPY: forwards to SAXPY_F77, passing n, alpha and the
   // strides by address.
   void BLAS<int, float>::AXPY(const int& n, const float& alpha, const float* x, const int& incx, float* y, const int& incy) const
   {
     SAXPY_F77(&n, &alpha, x, &incx, y, &incy);
   }


   // Single precision COPY: forwards to SCOPY_F77.
   void BLAS<int, float>::COPY(const int& n, const float* x, const int& incx, float* y, const int& incy) const
   {
     SCOPY_F77(&n, x, &incx, y, &incy);
   }


   // Single precision DOT.  Picks, at compile time, cblas_sdot, SDOT_F77 or
   // the file-local generic_dot, depending on which configuration macros are
   // defined.
   float BLAS<int, float>::DOT(const int& n, const float* x, const int& incx, const float* y, const int& incy) const
   {
 #if defined(HAVE_TEUCHOS_BLASFLOAT_APPLE_VECLIB_BUGFIX)
     const float result = cblas_sdot(n, x, incx, y, incy);
 #elif defined(HAVE_TEUCHOS_BLASFLOAT)
     const float result = SDOT_F77(&n, x, &incx, y, &incy);
 #else
     const float result = generic_dot(n, x, incx, y, incy);
 #endif
     return result;
   }


   // Single precision IAMAX: returns whatever index ISAMAX_F77 reports.
   int BLAS<int, float>::IAMAX(const int& n, const float* x, const int& incx) const
   {
     const int index = ISAMAX_F77(&n, x, &incx);
     return index;
   }


   // Single precision NRM2.  Uses cblas_snrm2 or SNRM2_F77 when configured;
   // otherwise takes the square root of generic_dot applied to x with itself.
   float BLAS<int, float>::NRM2(const int& n, const float* x, const int& incx) const
   {
 #if defined(HAVE_TEUCHOS_BLASFLOAT_APPLE_VECLIB_BUGFIX)
     const float norm = cblas_snrm2(n, x, incx);
 #elif defined(HAVE_TEUCHOS_BLASFLOAT)
     const float norm = SNRM2_F77(&n, x, &incx);
 #else
     const float sumOfSquares = generic_dot(n, x, incx, x, incx);
     const float norm = ScalarTraits<float>::squareroot(sumOfSquares);
 #endif
     return norm;
   }


   // Single precision SCAL: forwards to SSCAL_F77.
   void BLAS<int, float>::SCAL(const int& n, const float& alpha, float* x, const int& incx) const
   {
     SSCAL_F77(&n, &alpha, x, &incx);
   }


   // Single precision GEMV: forwards to SGEMV_F77, sending the transpose
   // selector as the character ETranspChar[trans].
   void BLAS<int, float>::GEMV(ETransp trans, const int& m, const int& n, const float& alpha, const float* A, const int& lda, const float* x, const int& incx, const float& beta, float* y, const int& incy) const
   {
     const char& transCode = ETranspChar[trans];
     SGEMV_F77(CHAR_MACRO(transCode), &m, &n, &alpha, A, &lda, x, &incx, &beta, y, &incy);
   }


   // Single precision GER: forwards to SGER_F77.
   void BLAS<int, float>::GER(const int& m, const int& n, const float& alpha, const float* x, const int& incx, const float* y, const int& incy, float* A, const int& lda) const
   {
     SGER_F77(&m, &n, &alpha, x, &incx, y, &incy, A, &lda);
   }


   // Single precision TRMV: forwards to STRMV_F77 with the uplo, trans and
   // diag selectors translated to their character codes.
   void BLAS<int, float>::TRMV(EUplo uplo, ETransp trans, EDiag diag, const int& n, const float* A, const int& lda, float* x, const int& incx) const
   {
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[trans];
     const char& diagCode = EDiagChar[diag];
     STRMV_F77(CHAR_MACRO(uploCode), CHAR_MACRO(transCode), CHAR_MACRO(diagCode), &n, A, &lda, x, &incx);
   }


   // Single precision GEMM: forwards to SGEMM_F77 with both transpose
   // selectors translated to their character codes.
   void BLAS<int, float>::GEMM(ETransp transa, ETransp transb, const int& m, const int& n, const int& k, const float& alpha, const float* A, const int& lda, const float* B, const int& ldb, const float& beta, float* C, const int& ldc) const
   {
     const char& transaCode = ETranspChar[transa];
     const char& transbCode = ETranspChar[transb];
     SGEMM_F77(CHAR_MACRO(transaCode), CHAR_MACRO(transbCode), &m, &n, &k, &alpha, A, &lda, B, &ldb, &beta, C, &ldc);
   }


   // Single precision SWAP: forwards to SSWAP_F77.
   void BLAS<int, float>::SWAP(const int& n, float* const x, const int& incx, float* const y, const int& incy) const
   { SSWAP_F77(&n, x, &incx, y, &incy); }


   // Single precision SYMM: forwards to SSYMM_F77 with the side and uplo
   // selectors translated to their character codes.
   void BLAS<int, float>::SYMM(ESide side, EUplo uplo, const int& m, const int& n, const float& alpha, const float* A, const int& lda, const float* B, const int& ldb, const float& beta, float* C, const int& ldc) const
   {
     const char& sideCode = ESideChar[side];
     const char& uploCode = EUploChar[uplo];
     SSYMM_F77(CHAR_MACRO(sideCode), CHAR_MACRO(uploCode), &m, &n, &alpha, A, &lda, B, &ldb, &beta, C, &ldc);
   }


   // Single precision SYRK: forwards to SSYRK_F77 with the uplo and trans
   // selectors translated to their character codes.
   void BLAS<int, float>::SYRK(EUplo uplo, ETransp trans, const int& n, const int& k, const float& alpha, const float* A, const int& lda, const float& beta, float* C, const int& ldc) const
   {
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[trans];
     SSYRK_F77(CHAR_MACRO(uploCode), CHAR_MACRO(transCode), &n, &k, &alpha, A, &lda, &beta, C, &ldc);
   }


   // Single precision HERK: issues the same SSYRK_F77 call that SYRK does.
   void BLAS<int, float>::HERK(EUplo uplo, ETransp trans, const int& n, const int& k, const float& alpha, const float* A, const int& lda, const float& beta, float* C, const int& ldc) const
   {
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[trans];
     SSYRK_F77(CHAR_MACRO(uploCode), CHAR_MACRO(transCode), &n, &k, &alpha, A, &lda, &beta, C, &ldc);
   }


   // Single precision TRMM: forwards to STRMM_F77 with the side, uplo, transa
   // and diag selectors translated to their character codes.
   void BLAS<int, float>::TRMM(ESide side, EUplo uplo, ETransp transa, EDiag diag, const int& m, const int& n, const float& alpha, const float* A, const int& lda, float* B, const int& ldb) const
   {
     const char& sideCode = ESideChar[side];
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[transa];
     const char& diagCode = EDiagChar[diag];
     STRMM_F77(CHAR_MACRO(sideCode), CHAR_MACRO(uploCode), CHAR_MACRO(transCode), CHAR_MACRO(diagCode), &m, &n, &alpha, A, &lda, B, &ldb);
   }


   // Single precision TRSM: forwards to STRSM_F77 with the side, uplo, transa
   // and diag selectors translated to their character codes.
   void BLAS<int, float>::TRSM(ESide side, EUplo uplo, ETransp transa, EDiag diag, const int& m, const int& n, const float& alpha, const float* A, const int& lda, float* B, const int& ldb) const
   {
     const char& sideCode = ESideChar[side];
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[transa];
     const char& diagCode = EDiagChar[diag];
     STRSM_F77(CHAR_MACRO(sideCode), CHAR_MACRO(uploCode), CHAR_MACRO(transCode), CHAR_MACRO(diagCode), &m, &n, &alpha, A, &lda, B, &ldb);
   }


   // *************************** BLAS<int,double> DEFINITIONS ******************************


   // Double precision ROTG: passes the four pointers unchanged to DROTG_F77.
   void BLAS<int, double>::ROTG(double* da, double* db, double* c, double* s) const
   {
     DROTG_F77(da, db, c, s);
   }


   // Double precision ROT: forwards to DROT_F77, passing n and the strides by
   // address.
   void BLAS<int, double>::ROT(const int& n, double* dx, const int& incx, double* dy, const int& incy, double* c, double* s) const
   {
     DROT_F77(&n, dx, &incx, dy, &incy, c, s);
   }


   // Double precision ASUM: returns the value computed by DASUM_F77.
   double BLAS<int, double>::ASUM(const int& n, const double* x, const int& incx) const
   {
     const double total = DASUM_F77(&n, x, &incx);
     return total;
   }


   // Double precision AXPY: forwards to DAXPY_F77.
   void BLAS<int, double>::AXPY(const int& n, const double& alpha, const double* x, const int& incx, double* y, const int& incy) const
   {
     DAXPY_F77(&n, &alpha, x, &incx, y, &incy);
   }


   // Double precision COPY: forwards to DCOPY_F77.
   void BLAS<int, double>::COPY(const int& n, const double* x, const int& incx, double* y, const int& incy) const
   {
     DCOPY_F77(&n, x, &incx, y, &incy);
   }


   // Double precision DOT: returns the value computed by DDOT_F77.
   double BLAS<int, double>::DOT(const int& n, const double* x, const int& incx, const double* y, const int& incy) const
   {
     const double result = DDOT_F77(&n, x, &incx, y, &incy);
     return result;
   }


   // Double precision IAMAX: returns whatever index IDAMAX_F77 reports.
   int BLAS<int, double>::IAMAX(const int& n, const double* x, const int& incx) const
   {
     const int index = IDAMAX_F77(&n, x, &incx);
     return index;
   }


   // Double precision NRM2: returns the value computed by DNRM2_F77.
   double BLAS<int, double>::NRM2(const int& n, const double* x, const int& incx) const
   {
     const double norm = DNRM2_F77(&n, x, &incx);
     return norm;
   }


   // Double precision SCAL: forwards to DSCAL_F77.
   void BLAS<int, double>::SCAL(const int& n, const double& alpha, double* x, const int& incx) const
   {
     DSCAL_F77(&n, &alpha, x, &incx);
   }


   // Double precision GEMV: forwards to DGEMV_F77, sending the transpose
   // selector as the character ETranspChar[trans].
   void BLAS<int, double>::GEMV(ETransp trans, const int& m, const int& n, const double& alpha, const double* A, const int& lda, const double* x, const int& incx, const double& beta, double* y, const int& incy) const
   {
     const char& transCode = ETranspChar[trans];
     DGEMV_F77(CHAR_MACRO(transCode), &m, &n, &alpha, A, &lda, x, &incx, &beta, y, &incy);
   }


   // Double precision GER: forwards to DGER_F77.
   void BLAS<int, double>::GER(const int& m, const int& n, const double& alpha, const double* x, const int& incx, const double* y, const int& incy, double* A, const int& lda) const
   {
     DGER_F77(&m, &n, &alpha, x, &incx, y, &incy, A, &lda);
   }


   // Double precision TRMV: forwards to DTRMV_F77 with the uplo, trans and
   // diag selectors translated to their character codes.
   void BLAS<int, double>::TRMV(EUplo uplo, ETransp trans, EDiag diag, const int& n, const double* A, const int& lda, double* x, const int& incx) const
   {
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[trans];
     const char& diagCode = EDiagChar[diag];
     DTRMV_F77(CHAR_MACRO(uploCode), CHAR_MACRO(transCode), CHAR_MACRO(diagCode), &n, A, &lda, x, &incx);
   }


   // Double precision GEMM: forwards to DGEMM_F77 with both transpose
   // selectors translated to their character codes.
   void BLAS<int, double>::GEMM(ETransp transa, ETransp transb, const int& m, const int& n, const int& k, const double& alpha, const double* A, const int& lda, const double* B, const int& ldb, const double& beta, double* C, const int& ldc) const
   {
     const char& transaCode = ETranspChar[transa];
     const char& transbCode = ETranspChar[transb];
     DGEMM_F77(CHAR_MACRO(transaCode), CHAR_MACRO(transbCode), &m, &n, &k, &alpha, A, &lda, B, &ldb, &beta, C, &ldc);
   }


   // Double precision SWAP: forwards to DSWAP_F77.
   void BLAS<int, double>::SWAP(const int& n, double* const x, const int& incx, double* const y, const int& incy) const
   { DSWAP_F77(&n, x, &incx, y, &incy); }


   // Double precision SYMM: forwards to DSYMM_F77 with the side and uplo
   // selectors translated to their character codes.
   void BLAS<int, double>::SYMM(ESide side, EUplo uplo, const int& m, const int& n, const double& alpha, const double* A, const int& lda, const double* B, const int& ldb, const double& beta, double* C, const int& ldc) const
   {
     const char& sideCode = ESideChar[side];
     const char& uploCode = EUploChar[uplo];
     DSYMM_F77(CHAR_MACRO(sideCode), CHAR_MACRO(uploCode), &m, &n, &alpha, A, &lda, B, &ldb, &beta, C, &ldc);
   }


   // Double precision SYRK: forwards to DSYRK_F77 with the uplo and trans
   // selectors translated to their character codes.
   void BLAS<int, double>::SYRK(EUplo uplo, ETransp trans, const int& n, const int& k, const double& alpha, const double* A, const int& lda, const double& beta, double* C, const int& ldc) const
   {
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[trans];
     DSYRK_F77(CHAR_MACRO(uploCode), CHAR_MACRO(transCode), &n, &k, &alpha, A, &lda, &beta, C, &ldc);
   }


   // Double precision HERK: issues the same DSYRK_F77 call that SYRK does.
   void BLAS<int, double>::HERK(EUplo uplo, ETransp trans, const int& n, const int& k, const double& alpha, const double* A, const int& lda, const double& beta, double* C, const int& ldc) const
   {
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[trans];
     DSYRK_F77(CHAR_MACRO(uploCode), CHAR_MACRO(transCode), &n, &k, &alpha, A, &lda, &beta, C, &ldc);
   }


   // Double precision TRMM: forwards to DTRMM_F77 with the side, uplo, transa
   // and diag selectors translated to their character codes.
   void BLAS<int, double>::TRMM(ESide side, EUplo uplo, ETransp transa, EDiag diag, const int& m, const int& n, const double& alpha, const double* A, const int& lda, double* B, const int& ldb) const
   {
     const char& sideCode = ESideChar[side];
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[transa];
     const char& diagCode = EDiagChar[diag];
     DTRMM_F77(CHAR_MACRO(sideCode), CHAR_MACRO(uploCode), CHAR_MACRO(transCode), CHAR_MACRO(diagCode), &m, &n, &alpha, A, &lda, B, &ldb);
   }


   // Double precision TRSM: forwards to DTRSM_F77 with the side, uplo, transa
   // and diag selectors translated to their character codes.
   void BLAS<int, double>::TRSM(ESide side, EUplo uplo, ETransp transa, EDiag diag, const int& m, const int& n, const double& alpha, const double* A, const int& lda, double* B, const int& ldb) const
   {
     const char& sideCode = ESideChar[side];
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[transa];
     const char& diagCode = EDiagChar[diag];
     DTRSM_F77(CHAR_MACRO(sideCode), CHAR_MACRO(uploCode), CHAR_MACRO(transCode), CHAR_MACRO(diagCode), &m, &n, &alpha, A, &lda, B, &ldb);
   }


 #ifdef HAVE_TEUCHOS_COMPLEX


   // *************************** BLAS<int,std::complex<float> > DEFINITIONS ******************************


   // Complex single precision ROTG: passes the four pointers unchanged to
   // CROTG_F77.
   void BLAS<int, std::complex<float> >::ROTG(std::complex<float>* da, std::complex<float>* db, float* c, std::complex<float>* s) const
   {
     CROTG_F77(da, db, c, s);
   }


   // Complex single precision ROT: forwards to CROT_F77.
   void BLAS<int, std::complex<float> >::ROT(const int& n, std::complex<float>* dx, const int& incx, std::complex<float>* dy, const int& incy, float* c, std::complex<float>* s) const
   {
     CROT_F77(&n, dx, &incx, dy, &incy, c, s);
   }


   // Complex single precision ASUM.  Uses cblas_scasum or SCASUM_F77 when the
   // build provides one of them; otherwise adds |real| + |imag| of every
   // visited entry in a local loop.
   float BLAS<int, std::complex<float> >::ASUM(const int& n, const std::complex<float>* x, const int& incx) const
   {
 #if defined(HAVE_TEUCHOS_BLASFLOAT_APPLE_VECLIB_BUGFIX)
     return cblas_scasum(n, x, incx);
 #elif defined(HAVE_TEUCHOS_BLASFLOAT_DOUBLE_RETURN)
     return static_cast<float> (SCASUM_F77(&n, x, &incx));
 #elif defined(HAVE_TEUCHOS_BLASFLOAT)
     return SCASUM_F77(&n, x, &incx);
 #else // No library routine is available.
     // mfh 01 Feb 2013: See www.netlib.org/blas/scasum.f.
     // The running total is kept in double precision.
     double total = 0;
     // With incx == 1 the bound equals n, so one loop serves both the unit
     // stride and the general stride.  A non-positive incx makes the bound
     // non-positive and the loop body never runs.
     const int bound = n * incx;
     for (int k = 0; k < bound; k += incx) {
       const std::complex<float>& entry = x[k];
       total += std::abs (std::real (entry)) + std::abs (std::imag (entry));
     }
     return static_cast<float> (total);
 #endif
   }


   // Complex single precision AXPY: forwards to CAXPY_F77; alpha is received
   // by value and passed on by address.
   void BLAS<int, std::complex<float> >::AXPY(const int& n, const std::complex<float> alpha, const std::complex<float>* x, const int& incx, std::complex<float>* y, const int& incy) const
   {
     CAXPY_F77(&n, &alpha, x, &incx, y, &incy);
   }


   // Complex single precision COPY: forwards to CCOPY_F77.
   void BLAS<int, std::complex<float> >::COPY(const int& n, const std::complex<float>* x, const int& incx, std::complex<float>* y, const int& incy) const
   {
     CCOPY_F77(&n, x, &incx, y, &incy);
   }


   // Complex single precision DOT.  Depending on the configuration macros it
   // calls cblas_cdotc_sub, one of the two CDOT_F77 calling conventions, or a
   // local loop that accumulates conj(x_i) * y_i.
   //
   // NOTE(review): unlike the std::complex<double> overload in this file, an
   // unfixable HAVE_COMPLEX_BLAS_PROBLEM still reaches the CDOT_F77
   // return-by-value call here when HAVE_TEUCHOS_BLASFLOAT is defined --
   // confirm that this is intended.
   std::complex<float> BLAS<int, std::complex<float> >::DOT(const int& n, const std::complex<float>* x, const int& incx, const std::complex<float>* y, const int& incy) const
   {
 #if defined(HAVE_TEUCHOS_BLASFLOAT_APPLE_VECLIB_BUGFIX)
     std::complex<float> result;
     cblas_cdotc_sub(n,x,incx,y,incy,&result);
     return result;
 #elif defined(HAVE_COMPLEX_BLAS_PROBLEM) && defined(HAVE_FIXABLE_COMPLEX_BLAS_PROBLEM)
     std::complex<float> result;
     CDOT_F77(&result, &n, x, &incx, y, &incy);
     return result;
 #elif defined(HAVE_TEUCHOS_BLASFLOAT)
     Teuchos_Complex_float_type_name fortranValue = CDOT_F77(&n, x, &incx, y, &incy);
     return TEUCHOS_BLAS_CONVERT_COMPLEX_FORTRAN_TO_CXX(float, fortranValue);
 #else // No library routine is available.
     // mfh 01 Feb 2013: See www.netlib.org/blas/cdotc.f.
     // The running sum is kept in double precision.
     std::complex<double> acc (0, 0);
     if (n >= 0) {
       const bool unitStrides = (incx == 1) && (incy == 1);
       int ix = 0;
       int iy = 0;
       if (! unitStrides) {
         // A negative stride starts at the far end of its vector.
         if (incx < 0) {
           ix = (1-n) * incx;
         }
         if (incy < 0) {
           iy = (1-n) * incy;
         }
       }
       for (int count = 0; count < n; ++count, ix += incx, iy += incy) {
         acc += std::conj (x[ix]) * y[iy];
       }
     }
     return static_cast<std::complex<float> > (acc);
 #endif
   }


   // Complex single precision IAMAX: returns whatever index ICAMAX_F77
   // reports.
   int BLAS<int, std::complex<float> >::IAMAX(const int& n, const std::complex<float>* x, const int& incx) const
   {
     const int index = ICAMAX_F77(&n, x, &incx);
     return index;
   }


   // Complex single precision NRM2.
   //
   // Uses cblas_scnrm2 or SCNRM2_F77 when the build configuration provides
   // one of them.  Otherwise a local loop visits n entries of x, incx apart,
   // and returns scale * sqrt(ssq), where scale is the largest magnitude of
   // any real or imaginary part seen and ssq is the sum of the squares of all
   // parts divided by scale^2.  The local loop returns 0 when n < 1 or
   // incx < 1.
   float BLAS<int, std::complex<float> >::NRM2(const int& n, const std::complex<float>* x, const int& incx) const

   {

 #if defined(HAVE_TEUCHOS_BLASFLOAT_APPLE_VECLIB_BUGFIX)

     return cblas_scnrm2(n, x, incx);

 #elif defined(HAVE_TEUCHOS_BLASFLOAT_DOUBLE_RETURN)

     return (float) SCNRM2_F77(&n, x, &incx);

 #elif defined(HAVE_TEUCHOS_BLASFLOAT)

     return SCNRM2_F77(&n, x, &incx);

 #else // Wow, you just plain don't have this routine.

     // mfh 01 Feb 2013: See www.netlib.org/blas/scnrm2.f.

     // I've enhanced this by accumulating in double precision.

     if (n < 1 || incx < 1) {

       return 0;

     } else {

       double scale = 0;

       double ssq = 1;


       // One past the index of the last entry visited.
       const int upper = 1 + (n-1)*incx;

       for (int ix = 0; ix < upper; ix += incx) {

         // The reference BLAS implementation cleverly scales the

         // intermediate result, so that even if the square of the norm

         // would overflow, computing the norm itself does not.  Hence,

         // "ssq" for "scaled sum of squares."

         if (std::real (x[ix]) != 0) {

           const double temp = std::abs (std::real (x[ix]));

           if (scale < temp) {

             // Re-express the running sum relative to the new, larger scale;
             // the leading 1 is (temp/temp)^2 for the current value.
             const double scale_over_temp = scale / temp;

             ssq = 1 + ssq * scale_over_temp*scale_over_temp;

             // New scaling factor: biggest (in magnitude) real or imaginary part seen thus far.

             scale = temp;

           } else {

             const double temp_over_scale = temp / scale;

             ssq = ssq + temp_over_scale*temp_over_scale;

           }

         }

         // Same update as above, applied to the imaginary part.
         if (std::imag (x[ix]) != 0) {

           const double temp = std::abs (std::imag (x[ix]));

           if (scale < temp) {

             const double scale_over_temp = scale / temp;

             ssq = 1 + ssq * scale_over_temp*scale_over_temp;

             // New scaling factor: biggest (in magnitude) real or imaginary part seen thus far.

             scale = temp;

           } else {

             const double temp_over_scale = temp / scale;

             ssq = ssq + temp_over_scale*temp_over_scale;

           }

         }

       }

       return static_cast<float> (scale * std::sqrt (ssq));

     }

 #endif

   }


   // Complex single precision SCAL: forwards to CSCAL_F77.
   void BLAS<int, std::complex<float> >::SCAL(const int& n, const std::complex<float> alpha, std::complex<float>* x, const int& incx) const
   {
     CSCAL_F77(&n, &alpha, x, &incx);
   }


   // Complex single precision GEMV: forwards to CGEMV_F77, sending the
   // transpose selector as the character ETranspChar[trans].
   void BLAS<int, std::complex<float> >::GEMV(ETransp trans, const int& m, const int& n, const std::complex<float> alpha, const std::complex<float>* A, const int& lda, const std::complex<float>* x, const int& incx, const std::complex<float> beta, std::complex<float>* y, const int& incy) const
   {
     const char& transCode = ETranspChar[trans];
     CGEMV_F77(CHAR_MACRO(transCode), &m, &n, &alpha, A, &lda, x, &incx, &beta, y, &incy);
   }


   // Complex single precision GER: forwards to CGER_F77.
   void BLAS<int, std::complex<float> >::GER(const int& m, const int& n, const std::complex<float> alpha, const std::complex<float>* x, const int& incx, const std::complex<float>* y, const int& incy, std::complex<float>* A, const int& lda) const
   {
     CGER_F77(&m, &n, &alpha, x, &incx, y, &incy, A, &lda);
   }


   // Complex single precision TRMV: forwards to CTRMV_F77 with the uplo,
   // trans and diag selectors translated to their character codes.
   void BLAS<int, std::complex<float> >::TRMV(EUplo uplo, ETransp trans, EDiag diag, const int& n, const std::complex<float>* A, const int& lda, std::complex<float>* x, const int& incx) const
   {
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[trans];
     const char& diagCode = EDiagChar[diag];
     CTRMV_F77(CHAR_MACRO(uploCode), CHAR_MACRO(transCode), CHAR_MACRO(diagCode), &n, A, &lda, x, &incx);
   }


   // Complex single precision GEMM: forwards to CGEMM_F77 with both transpose
   // selectors translated to their character codes.
   void BLAS<int, std::complex<float> >::GEMM(ETransp transa, ETransp transb, const int& m, const int& n, const int& k, const std::complex<float> alpha, const std::complex<float>* A, const int& lda, const std::complex<float>* B, const int& ldb, const std::complex<float> beta, std::complex<float>* C, const int& ldc) const
   {
     const char& transaCode = ETranspChar[transa];
     const char& transbCode = ETranspChar[transb];
     CGEMM_F77(CHAR_MACRO(transaCode), CHAR_MACRO(transbCode), &m, &n, &k, &alpha, A, &lda, B, &ldb, &beta, C, &ldc);
   }


   // Complex single precision SWAP: forwards to CSWAP_F77.
   void BLAS<int, std::complex<float> >::SWAP(const int& n, std::complex<float>* const x, const int& incx, std::complex<float>* const y, const int& incy) const
   { CSWAP_F77(&n, x, &incx, y, &incy); }


   // Complex single precision SYMM: forwards to CSYMM_F77 with the side and
   // uplo selectors translated to their character codes.
   void BLAS<int, std::complex<float> >::SYMM(ESide side, EUplo uplo, const int& m, const int& n, const std::complex<float> alpha, const std::complex<float>* A, const int& lda, const std::complex<float>* B, const int& ldb, const std::complex<float> beta, std::complex<float>* C, const int& ldc) const
   {
     const char& sideCode = ESideChar[side];
     const char& uploCode = EUploChar[uplo];
     CSYMM_F77(CHAR_MACRO(sideCode), CHAR_MACRO(uploCode), &m, &n, &alpha, A, &lda, B, &ldb, &beta, C, &ldc);
   }


   // Complex single precision SYRK: forwards to CSYRK_F77 with the uplo and
   // trans selectors translated to their character codes.
   void BLAS<int, std::complex<float> >::SYRK(EUplo uplo, ETransp trans, const int& n, const int& k, const std::complex<float> alpha, const std::complex<float>* A, const int& lda, const std::complex<float> beta, std::complex<float>* C, const int& ldc) const
   {
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[trans];
     CSYRK_F77(CHAR_MACRO(uploCode), CHAR_MACRO(transCode), &n, &k, &alpha, A, &lda, &beta, C, &ldc);
   }


   // Complex single precision HERK: forwards to CHERK_F77 with the uplo and
   // trans selectors translated to their character codes.
   void BLAS<int, std::complex<float> >::HERK(EUplo uplo, ETransp trans, const int& n, const int& k, const std::complex<float> alpha, const std::complex<float>* A, const int& lda, const std::complex<float> beta, std::complex<float>* C, const int& ldc) const
   {
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[trans];
     CHERK_F77(CHAR_MACRO(uploCode), CHAR_MACRO(transCode), &n, &k, &alpha, A, &lda, &beta, C, &ldc);
   }


   // Complex single precision TRMM: forwards to CTRMM_F77 with the side,
   // uplo, transa and diag selectors translated to their character codes.
   void BLAS<int, std::complex<float> >::TRMM(ESide side, EUplo uplo, ETransp transa, EDiag diag, const int& m, const int& n, const std::complex<float> alpha, const std::complex<float>* A, const int& lda, std::complex<float>* B, const int& ldb) const
   {
     const char& sideCode = ESideChar[side];
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[transa];
     const char& diagCode = EDiagChar[diag];
     CTRMM_F77(CHAR_MACRO(sideCode), CHAR_MACRO(uploCode), CHAR_MACRO(transCode), CHAR_MACRO(diagCode), &m, &n, &alpha, A, &lda, B, &ldb);
   }


   // Complex single precision TRSM: forwards to CTRSM_F77 with the side,
   // uplo, transa and diag selectors translated to their character codes.
   void BLAS<int, std::complex<float> >::TRSM(ESide side, EUplo uplo, ETransp transa, EDiag diag, const int& m, const int& n, const std::complex<float> alpha, const std::complex<float>* A, const int& lda, std::complex<float>* B, const int& ldb) const
   {
     const char& sideCode = ESideChar[side];
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[transa];
     const char& diagCode = EDiagChar[diag];
     CTRSM_F77(CHAR_MACRO(sideCode), CHAR_MACRO(uploCode), CHAR_MACRO(transCode), CHAR_MACRO(diagCode), &m, &n, &alpha, A, &lda, B, &ldb);
   }


   // *************************** BLAS<int,std::complex<double> > DEFINITIONS ******************************


   // Complex double precision ROTG: passes the four pointers unchanged to
   // ZROTG_F77.
   void BLAS<int, std::complex<double> >::ROTG(std::complex<double>* da, std::complex<double>* db, double* c, std::complex<double>* s) const
   {
     ZROTG_F77(da, db, c, s);
   }


   // Complex double precision ROT: forwards to ZROT_F77.
   void BLAS<int, std::complex<double> >::ROT(const int& n, std::complex<double>* dx, const int& incx, std::complex<double>* dy, const int& incy, double* c, std::complex<double>* s) const
   {
     ZROT_F77(&n, dx, &incx, dy, &incy, c, s);
   }


   // Complex double precision ASUM: returns the value computed by ZASUM_F77.
   double BLAS<int, std::complex<double> >::ASUM(const int& n, const std::complex<double>* x, const int& incx) const
   {
     const double total = ZASUM_F77(&n, x, &incx);
     return total;
   }


   // Complex double precision AXPY: forwards to ZAXPY_F77; alpha is received
   // by value and passed on by address.
   void BLAS<int, std::complex<double> >::AXPY(const int& n, const std::complex<double> alpha, const std::complex<double>* x, const int& incx, std::complex<double>* y, const int& incy) const
   {
     ZAXPY_F77(&n, &alpha, x, &incx, y, &incy);
   }


   // Complex double precision COPY: forwards to ZCOPY_F77.
   void BLAS<int, std::complex<double> >::COPY(const int& n, const std::complex<double>* x, const int& incx, std::complex<double>* y, const int& incy) const
   {
     ZCOPY_F77(&n, x, &incx, y, &incy);
   }


   // Complex double precision DOT.  Depending on the configuration macros it
   // calls cblas_zdotc_sub, one of the two ZDOT_F77 calling conventions, or
   // (when HAVE_COMPLEX_BLAS_PROBLEM is set without the fixable variant) a
   // local loop that accumulates conj(x_i) * y_i.
   std::complex<double> BLAS<int, std::complex<double> >::DOT(const int& n, const std::complex<double>* x, const int& incx, const std::complex<double>* y, const int& incy) const
   {
 #if defined(HAVE_TEUCHOS_BLASFLOAT_APPLE_VECLIB_BUGFIX)
     std::complex<double> result;
     cblas_zdotc_sub(n,x,incx,y,incy,&result);
     return result;
 #elif defined(HAVE_COMPLEX_BLAS_PROBLEM)
 #  if defined(HAVE_FIXABLE_COMPLEX_BLAS_PROBLEM)
     std::complex<double> result;
     ZDOT_F77(&result, &n, x, &incx, y, &incy);
     return result;
 #  else
     // mfh 01 Feb 2013: Your complex BLAS is broken, but the problem
     // doesn't have the easy workaround, so the missing routine is
     // reimplemented here.  See www.netlib.org/blas/zdotc.f.
     std::complex<double> acc (0, 0);
     if (n > 0) {
       const bool unitStrides = (incx == 1) && (incy == 1);
       int ix = 0;
       int iy = 0;
       if (! unitStrides) {
         // A negative stride starts at the far end of its vector.
         if (incx < 0) {
           ix = (1-n)*incx;
         }
         if (incy < 0) {
           iy = (1-n)*incy;
         }
       }
       for (int count = 0; count < n; ++count, ix += incx, iy += incy) {
         acc += std::conj (x[ix]) * y[iy];
       }
     }
     return acc;
 #  endif // defined(HAVE_FIXABLE_COMPLEX_BLAS_PROBLEM)
 #else
     Teuchos_Complex_double_type_name fortranValue = ZDOT_F77(&n, x, &incx, y, &incy);
     return TEUCHOS_BLAS_CONVERT_COMPLEX_FORTRAN_TO_CXX(double, fortranValue);
 #endif
   }


   // Complex double precision IAMAX: returns whatever index IZAMAX_F77
   // reports.
   int BLAS<int, std::complex<double> >::IAMAX(const int& n, const std::complex<double>* x, const int& incx) const
   {
     const int index = IZAMAX_F77(&n, x, &incx);
     return index;
   }


   // Complex double precision NRM2: returns the value computed by ZNRM2_F77.
   double BLAS<int, std::complex<double> >::NRM2(const int& n, const std::complex<double>* x, const int& incx) const
   {
     const double norm = ZNRM2_F77(&n, x, &incx);
     return norm;
   }


   // Complex double precision SCAL: forwards to ZSCAL_F77.
   void BLAS<int, std::complex<double> >::SCAL(const int& n, const std::complex<double> alpha, std::complex<double>* x, const int& incx) const
   {
     ZSCAL_F77(&n, &alpha, x, &incx);
   }


   // Complex double precision GEMV: forwards to ZGEMV_F77, sending the
   // transpose selector as the character ETranspChar[trans].
   void BLAS<int, std::complex<double> >::GEMV(ETransp trans, const int& m, const int& n, const std::complex<double> alpha, const std::complex<double>* A, const int& lda, const std::complex<double>* x, const int& incx, const std::complex<double> beta, std::complex<double>* y, const int& incy) const
   {
     const char& transCode = ETranspChar[trans];
     ZGEMV_F77(CHAR_MACRO(transCode), &m, &n, &alpha, A, &lda, x, &incx, &beta, y, &incy);
   }


   // Complex double precision GER: forwards to ZGER_F77.
   void BLAS<int, std::complex<double> >::GER(const int& m, const int& n, const std::complex<double> alpha, const std::complex<double>* x, const int& incx, const std::complex<double>* y, const int& incy, std::complex<double>* A, const int& lda) const
   {
     ZGER_F77(&m, &n, &alpha, x, &incx, y, &incy, A, &lda);
   }


   // Complex double precision TRMV: forwards to ZTRMV_F77 with the uplo,
   // trans and diag selectors translated to their character codes.
   void BLAS<int, std::complex<double> >::TRMV(EUplo uplo, ETransp trans, EDiag diag, const int& n, const std::complex<double>* A, const int& lda, std::complex<double>* x, const int& incx) const
   {
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[trans];
     const char& diagCode = EDiagChar[diag];
     ZTRMV_F77(CHAR_MACRO(uploCode), CHAR_MACRO(transCode), CHAR_MACRO(diagCode), &n, A, &lda, x, &incx);
   }


   // Complex double precision GEMM: forwards to ZGEMM_F77 with both transpose
   // selectors translated to their character codes.
   void BLAS<int, std::complex<double> >::GEMM(ETransp transa, ETransp transb, const int& m, const int& n, const int& k, const std::complex<double> alpha, const std::complex<double>* A, const int& lda, const std::complex<double>* B, const int& ldb, const std::complex<double> beta, std::complex<double>* C, const int& ldc) const
   {
     const char& transaCode = ETranspChar[transa];
     const char& transbCode = ETranspChar[transb];
     ZGEMM_F77(CHAR_MACRO(transaCode), CHAR_MACRO(transbCode), &m, &n, &k, &alpha, A, &lda, B, &ldb, &beta, C, &ldc);
   }


   // Complex double precision SWAP: forwards to ZSWAP_F77.
   void BLAS<int, std::complex<double> >::SWAP(const int& n, std::complex<double>* const x, const int& incx, std::complex<double>* const y, const int& incy) const
   { ZSWAP_F77(&n, x, &incx, y, &incy); }


   // Complex double precision SYMM: forwards to ZSYMM_F77 with the side and
   // uplo selectors translated to their character codes.
   void BLAS<int, std::complex<double> >::SYMM(ESide side, EUplo uplo, const int& m, const int& n, const std::complex<double> alpha, const std::complex<double>* A, const int& lda, const std::complex<double> *B, const int& ldb, const std::complex<double> beta, std::complex<double> *C, const int& ldc) const
   {
     const char& sideCode = ESideChar[side];
     const char& uploCode = EUploChar[uplo];
     ZSYMM_F77(CHAR_MACRO(sideCode), CHAR_MACRO(uploCode), &m, &n, &alpha, A, &lda, B, &ldb, &beta, C, &ldc);
   }


   // Complex double precision SYRK: forwards to ZSYRK_F77 with the uplo and
   // trans selectors translated to their character codes.
   void BLAS<int, std::complex<double> >::SYRK(EUplo uplo, ETransp trans, const int& n, const int& k, const std::complex<double> alpha, const std::complex<double>* A, const int& lda, const std::complex<double> beta, std::complex<double>* C, const int& ldc) const
   {
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[trans];
     ZSYRK_F77(CHAR_MACRO(uploCode), CHAR_MACRO(transCode), &n, &k, &alpha, A, &lda, &beta, C, &ldc);
   }


   // Complex double precision HERK: forwards to ZHERK_F77 with the uplo and
   // trans selectors translated to their character codes.
   void BLAS<int, std::complex<double> >::HERK(EUplo uplo, ETransp trans, const int& n, const int& k, const std::complex<double> alpha, const std::complex<double>* A, const int& lda, const std::complex<double> beta, std::complex<double>* C, const int& ldc) const
   {
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[trans];
     ZHERK_F77(CHAR_MACRO(uploCode), CHAR_MACRO(transCode), &n, &k, &alpha, A, &lda, &beta, C, &ldc);
   }


   // Complex double precision TRMM: forwards to ZTRMM_F77 with the side,
   // uplo, transa and diag selectors translated to their character codes.
   void BLAS<int, std::complex<double> >::TRMM(ESide side, EUplo uplo, ETransp transa, EDiag diag, const int& m, const int& n, const std::complex<double> alpha, const std::complex<double>* A, const int& lda, std::complex<double>* B, const int& ldb) const
   {
     const char& sideCode = ESideChar[side];
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[transa];
     const char& diagCode = EDiagChar[diag];
     ZTRMM_F77(CHAR_MACRO(sideCode), CHAR_MACRO(uploCode), CHAR_MACRO(transCode), CHAR_MACRO(diagCode), &m, &n, &alpha, A, &lda, B, &ldb);
   }


   // Complex double precision TRSM: forwards to ZTRSM_F77 with the side,
   // uplo, transa and diag selectors translated to their character codes.
   void BLAS<int, std::complex<double> >::TRSM(ESide side, EUplo uplo, ETransp transa, EDiag diag, const int& m, const int& n, const std::complex<double> alpha, const std::complex<double>* A, const int& lda, std::complex<double>* B, const int& ldb) const
   {
     const char& sideCode = ESideChar[side];
     const char& uploCode = EUploChar[uplo];
     const char& transCode = ETranspChar[transa];
     const char& diagCode = EDiagChar[diag];
     ZTRSM_F77(CHAR_MACRO(sideCode), CHAR_MACRO(uploCode), CHAR_MACRO(transCode), CHAR_MACRO(diagCode), &m, &n, &alpha, A, &lda, B, &ldb);
   }


 #endif // HAVE_TEUCHOS_COMPLEX


 }

Teuchos::DefaultBLASImpl::TRSM
void TRSM(ESide side, EUplo uplo, ETransp transa, EDiag diag, const OrdinalType &m, const OrdinalType &n, const alpha_type alpha, const A_type *A, const OrdinalType &lda, ScalarType *B, const OrdinalType &ldb) const
Solves the matrix equations: op(A)*X=alpha*B or X*op(A)=alpha*B where X and B are m by n matrices...
Definition: Teuchos_BLAS.hpp:1930

Teuchos::DefaultBLASImpl::GER
void GER(const OrdinalType &m, const OrdinalType &n, const alpha_type alpha, const x_type *x, const OrdinalType &incx, const y_type *y, const OrdinalType &incy, ScalarType *A, const OrdinalType &lda) const
Performs the rank 1 operation: A <- alpha*x*y'+A.
Definition: Teuchos_BLAS.hpp:1034

Teuchos_Complex_double_type_name
#define Teuchos_Complex_double_type_name
Definition: Teuchos_BLAS_wrappers.hpp:44

Teuchos::DefaultBLASImpl::AXPY
void AXPY(const OrdinalType &n, const alpha_type alpha, const x_type *x, const OrdinalType &incx, ScalarType *y, const OrdinalType &incy) const
Perform the operation: y <- y+alpha*x.
Definition: Teuchos_BLAS.hpp:561

DTRMV_F77
void PREFIX DTRMV_F77(Teuchos_fcd, Teuchos_fcd, Teuchos_fcd, const int *n, const double *a, const int *lda, double *x, const int *incx)

B
Definition: core/test/dyn_cast/cxx_main.cpp:16

DROTG_F77
void PREFIX DROTG_F77(double *da, double *db, double *c, double *s)

Teuchos::DefaultBLASImpl::TRMV
void TRMV(EUplo uplo, ETransp trans, EDiag diag, const OrdinalType &n, const A_type *A, const OrdinalType &lda, ScalarType *x, const OrdinalType &incx) const
Performs the matrix-vector operation: x <- A*x or x <- A'*x where A is a unit/non-unit n by n upper/low...
Definition: Teuchos_BLAS.hpp:839

DGEMM_F77
void PREFIX DGEMM_F77(Teuchos_fcd, Teuchos_fcd, const int *m, const int *n, const int *k, const double *alpha, const double *a, const int *lda, const double *b, const int *ldb, const double *beta, double *c, const int *ldc)

DGEMV_F77
void PREFIX DGEMV_F77(Teuchos_fcd, const int *m, const int *n, const double *alpha, const double A[], const int *lda, const double x[], const int *incx, const double *beta, double y[], const int *incy)

ISAMAX_F77
int PREFIX ISAMAX_F77(const int *n, const float *x, const int *incx)

Teuchos_BLAS.hpp
Templated interface class to BLAS routines.

Teuchos::DefaultBLASImpl::GEMV
void GEMV(ETransp trans, const OrdinalType &m, const OrdinalType &n, const alpha_type alpha, const A_type *A, const OrdinalType &lda, const x_type *x, const OrdinalType &incx, const beta_type beta, ScalarType *y, const OrdinalType &incy) const
Performs the matrix-vector operation: y <- alpha*A*x+beta*y or y <- alpha*A'*x+beta*y where A is a gene...
Definition: Teuchos_BLAS.hpp:686

Teuchos::DefaultBLASImpl::ROT
void ROT(const OrdinalType &n, ScalarType *dx, const OrdinalType &incx, ScalarType *dy, const OrdinalType &incy, MagnitudeType *c, ScalarType *s) const
Applies a Givens plane rotation.
Definition: Teuchos_BLAS.hpp:495

DROT_F77
void PREFIX DROT_F77(const int *n, double *dx, const int *incx, double *dy, const int *incy, double *c, double *s)

SGEMV_F77
void PREFIX SGEMV_F77(Teuchos_fcd, const int *m, const int *n, const float *alpha, const float A[], const int *lda, const float x[], const int *incx, const float *beta, float y[], const int *incy)

SCOPY_F77
void PREFIX SCOPY_F77(const int *n, const float *x, const int *incx, float *y, const int *incy)

Teuchos::ScalarTraits::squareroot
static T squareroot(T x)
Returns a number of magnitudeType that is the square root of this scalar type x.
Definition: Teuchos_ScalarTraitsDecl.hpp:122

SROTG_F77
void PREFIX SROTG_F77(float *da, float *db, float *c, float *s)

Teuchos_Complex_float_type_name
#define Teuchos_Complex_float_type_name
Definition: Teuchos_BLAS_wrappers.hpp:45

DSCAL_F77
void PREFIX DSCAL_F77(const int *n, const double *alpha, double *x, const int *incx)

DSWAP_F77
void PREFIX DSWAP_F77(const int *const n, double *const x, const int *const incx, double *const y, const int *const incy)

DSYRK_F77
void PREFIX DSYRK_F77(Teuchos_fcd, Teuchos_fcd, const int *n, const int *k, const double *alpha, const double *a, const int *lda, const double *beta, double *c, const int *ldc)

SSYMM_F77
void PREFIX SSYMM_F77(Teuchos_fcd, Teuchos_fcd, const int *m, const int *n, const float *alpha, const float *a, const int *lda, const float *b, const int *ldb, const float *beta, float *c, const int *ldc)

C
Definition: core/example/RefCountPtr/cxx_main.cpp:21

Teuchos::BLAS
Templated BLAS wrapper.
Definition: Teuchos_BLAS.hpp:212

A
Definition: core/example/RefCountPtr/cxx_main.cpp:13

Teuchos::DefaultBLASImpl::NRM2
ScalarTraits< ScalarType >::magnitudeType NRM2(const OrdinalType &n, const ScalarType *x, const OrdinalType &incx) const
Compute the 2-norm of the vector x.
Definition: Teuchos_BLAS.hpp:629

Teuchos::DefaultBLASImpl::IAMAX
OrdinalType IAMAX(const OrdinalType &n, const ScalarType *x, const OrdinalType &incx) const
Return the index of the element of x with the maximum magnitude.
Definition: Teuchos_BLAS.hpp:650

Teuchos::DefaultBLASImpl::GEMM
void GEMM(ETransp transa, ETransp transb, const OrdinalType &m, const OrdinalType &n, const OrdinalType &k, const alpha_type alpha, const A_type *A, const OrdinalType &lda, const B_type *B, const OrdinalType &ldb, const beta_type beta, ScalarType *C, const OrdinalType &ldc) const
General matrix-matrix multiply.
Definition: Teuchos_BLAS.hpp:1109

DNRM2_F77
double PREFIX DNRM2_F77(const int *n, const double x[], const int *incx)

Teuchos_BLAS_wrappers.hpp
The Templated BLAS wrappers.

Teuchos::EDiagChar
TEUCHOSNUMERICS_LIB_DLL_EXPORT const char EDiagChar[]
Definition: Teuchos_BLAS.cpp:37

DAXPY_F77
void PREFIX DAXPY_F77(const int *n, const double *alpha, const double x[], const int *incx, double y[], const int *incy)

Teuchos::ScalarTraits
This structure defines some basic traits for a scalar field type.
Definition: Teuchos_ScalarTraitsDecl.hpp:58

SDOT_F77
#define SDOT_F77
Definition: Teuchos_BLAS_wrappers.hpp:100

Teuchos::DefaultBLASImpl::ASUM
ScalarTraits< ScalarType >::magnitudeType ASUM(const OrdinalType &n, const ScalarType *x, const OrdinalType &incx) const
Sum the absolute values of the entries of x.
Definition: Teuchos_BLAS.hpp:582

SSWAP_F77
void PREFIX SSWAP_F77(const int *const n, float *const x, const int *const incx, float *const y, const int *const incy)

Teuchos::DefaultBLASImpl::COPY
void COPY(const OrdinalType &n, const ScalarType *x, const OrdinalType &incx, ScalarType *y, const OrdinalType &incy) const
Copy the vector x to the vector y.
Definition: Teuchos_BLAS.hpp:540

SGER_F77
void PREFIX SGER_F77(const int *m, const int *n, const float *alpha, const float *x, const int *incx, const float *y, const int *incy, float *a, const int *lda)

Teuchos::EUploChar
TEUCHOSNUMERICS_LIB_DLL_EXPORT const char EUploChar[]
Definition: Teuchos_BLAS.cpp:36

DTRSM_F77
void PREFIX DTRSM_F77(Teuchos_fcd, Teuchos_fcd, Teuchos_fcd, Teuchos_fcd, const int *m, const int *n, const double *alpha, const double *a, const int *lda, double *b, const int *ldb)

DASUM_F77
double PREFIX DASUM_F77(const int *n, const double x[], const int *incx)

SSYRK_F77
void PREFIX SSYRK_F77(Teuchos_fcd, Teuchos_fcd, const int *n, const int *k, const float *alpha, const float *a, const int *lda, const float *beta, float *c, const int *ldc)

Teuchos::ETypeChar
TEUCHOSNUMERICS_LIB_DLL_EXPORT const char ETypeChar[]
Definition: Teuchos_BLAS.cpp:38

Teuchos::DefaultBLASImpl::DOT
ScalarType DOT(const OrdinalType &n, const x_type *x, const OrdinalType &incx, const y_type *y, const OrdinalType &incy) const
Form the dot product of the vectors x and y.
Definition: Teuchos_BLAS.hpp:606

STRMV_F77
void PREFIX STRMV_F77(Teuchos_fcd, Teuchos_fcd, Teuchos_fcd, const int *n, const float *a, const int *lda, float *x, const int *incx)

SSCAL_F77
void PREFIX SSCAL_F77(const int *n, const float *alpha, float *x, const int *incx)

Teuchos::ESideChar
TEUCHOSNUMERICS_LIB_DLL_EXPORT const char ESideChar[]
Definition: Teuchos_BLAS.cpp:34

IDAMAX_F77
int PREFIX IDAMAX_F77(const int *n, const double *x, const int *incx)

SGEMM_F77
void PREFIX SGEMM_F77(Teuchos_fcd, Teuchos_fcd, const int *m, const int *n, const int *k, const float *alpha, const float *a, const int *lda, const float *b, const int *ldb, const float *beta, float *c, const int *ldc)

CHAR_MACRO
#define CHAR_MACRO(char_var)
Definition: Teuchos_BLAS.cpp:30

Teuchos::DefaultBLASImpl::SYMM
void SYMM(ESide side, EUplo uplo, const OrdinalType &m, const OrdinalType &n, const alpha_type alpha, const A_type *A, const OrdinalType &lda, const B_type *B, const OrdinalType &ldb, const beta_type beta, ScalarType *C, const OrdinalType &ldc) const
Performs the matrix-matrix operation: C <- alpha*A*B+beta*C or C <- alpha*B*A+beta*C where A is an m ...
Definition: Teuchos_BLAS.hpp:1393

Teuchos::DefaultBLASImpl::TRMM
void TRMM(ESide side, EUplo uplo, ETransp transa, EDiag diag, const OrdinalType &m, const OrdinalType &n, const alpha_type alpha, const A_type *A, const OrdinalType &lda, ScalarType *B, const OrdinalType &ldb) const
Performs the matrix-matrix operation: B <- alpha*op(A)*B or B <- alpha*B*op(A) where op(A) is a unit...
Definition: Teuchos_BLAS.hpp:1697

Teuchos::DefaultBLASImpl::SCAL
void SCAL(const OrdinalType &n, const ScalarType &alpha, ScalarType *x, const OrdinalType &incx) const
Scale the vector x by the constant alpha.
Definition: Teuchos_BLAS.hpp:522

Teuchos::DefaultBLASImpl::ROTG
void ROTG(ScalarType *da, ScalarType *db, rotg_c_type *c, ScalarType *s) const
Computes a Givens plane rotation.
Definition: Teuchos_BLAS.hpp:485

SASUM_F77
#define SASUM_F77
Definition: Teuchos_BLAS_wrappers.hpp:102

Teuchos::EUplo
EUplo
Definition: Teuchos_BLAS_types.hpp:65

SAXPY_F77
void PREFIX SAXPY_F77(const int *n, const float *alpha, const float x[], const int *incx, float y[], const int *incy)

Teuchos::ESide
ESide
Definition: Teuchos_BLAS_types.hpp:54

Teuchos::ETranspChar
TEUCHOSNUMERICS_LIB_DLL_EXPORT const char ETranspChar[]
Definition: Teuchos_BLAS.cpp:35

Teuchos::DefaultBLASImpl::SYRK
void SYRK(EUplo uplo, ETransp trans, const OrdinalType &n, const OrdinalType &k, const alpha_type alpha, const A_type *A, const OrdinalType &lda, const beta_type beta, ScalarType *C, const OrdinalType &ldc) const
Performs the symmetric rank k operation: C <- alpha*A*A'+beta*C or C <- alpha*A'*A+beta*C, where alpha and beta are scalars, C is an n by n symmetric matrix and A is an n by k matrix in the first case or k by n matrix in the second case.
Definition: Teuchos_BLAS.hpp:1523

STRMM_F77
void PREFIX STRMM_F77(Teuchos_fcd, Teuchos_fcd, Teuchos_fcd, Teuchos_fcd, const int *m, const int *n, const float *alpha, const float *a, const int *lda, float *b, const int *ldb)

DTRMM_F77
void PREFIX DTRMM_F77(Teuchos_fcd, Teuchos_fcd, Teuchos_fcd, Teuchos_fcd, const int *m, const int *n, const double *alpha, const double *a, const int *lda, double *b, const int *ldb)

SROT_F77
void PREFIX SROT_F77(const int *n, float *dx, const int *incx, float *dy, const int *incy, float *c, float *s)

STRSM_F77
void PREFIX STRSM_F77(Teuchos_fcd, Teuchos_fcd, Teuchos_fcd, Teuchos_fcd, const int *m, const int *n, const float *alpha, const float *a, const int *lda, float *b, const int *ldb)

DGER_F77
void PREFIX DGER_F77(const int *m, const int *n, const double *alpha, const double *x, const int *incx, const double *y, const int *incy, double *a, const int *lda)

DCOPY_F77
void PREFIX DCOPY_F77(const int *n, const double *x, const int *incx, double *y, const int *incy)

DDOT_F77
double PREFIX DDOT_F77(const int *n, const double x[], const int *incx, const double y[], const int *incy)

Teuchos::ETransp
ETransp
Definition: Teuchos_BLAS_types.hpp:59

ArrayUnitTestHelpers::n
int n
Definition: Array_UnitTest_helpers.cpp:13

Teuchos::DefaultBLASImpl::SWAP
void SWAP(const OrdinalType &n, ScalarType *const x, const OrdinalType &incx, ScalarType *const y, const OrdinalType &incy) const
Swap the entries of x and y.
Definition: Teuchos_BLAS.hpp:1356

SNRM2_F77
#define SNRM2_F77
Definition: Teuchos_BLAS_wrappers.hpp:101

Teuchos::EDiag
EDiag
Definition: Teuchos_BLAS_types.hpp:71

DSYMM_F77
void PREFIX DSYMM_F77(Teuchos_fcd, Teuchos_fcd, const int *m, const int *n, const double *alpha, const double *a, const int *lda, const double *b, const int *ldb, const double *beta, double *c, const int *ldc)