// // Copyright (c) 2002--2010 // Toon Knapen, Karl Meerbergen, Kresimir Fresl, // Thomas Klimpel and Rutger ter Borg // // Distributed under the Boost Software License, Version 1.0. // (See accompanying file LICENSE_1_0.txt or copy at // http://www.boost.org/LICENSE_1_0.txt) // // THIS FILE IS AUTOMATICALLY GENERATED // PLEASE DO NOT EDIT! // #ifndef BOOST_NUMERIC_BINDINGS_BLAS_LEVEL3_GEMM_HPP #define BOOST_NUMERIC_BINDINGS_BLAS_LEVEL3_GEMM_HPP #include #include #include #include #include #include #include #include #include #include #include #include #include // // The BLAS-backend is selected by defining a pre-processor variable, // which can be one of // * for CBLAS, define BOOST_NUMERIC_BINDINGS_BLAS_CBLAS // * for CUBLAS, define BOOST_NUMERIC_BINDINGS_BLAS_CUBLAS // * netlib-compatible BLAS is the default // #if defined BOOST_NUMERIC_BINDINGS_BLAS_CBLAS #include #include #elif defined BOOST_NUMERIC_BINDINGS_BLAS_CUBLAS #include #include #else #include #include #endif namespace boost { namespace numeric { namespace bindings { namespace blas { // // The detail namespace contains value-type-overloaded functions that // dispatch to the appropriate back-end BLAS-routine. // namespace detail { #if defined BOOST_NUMERIC_BINDINGS_BLAS_CBLAS // // Overloaded function for dispatching to // * CBLAS backend, and // * float value-type. // template< typename Order, typename TransA, typename TransB > inline void gemm( const Order, const TransA, const TransB, const int m, const int n, const int k, const float alpha, const float* a, const int lda, const float* b, const int ldb, const float beta, float* c, const int ldc ) { cblas_sgemm( cblas_option< Order >::value, cblas_option< TransA >::value, cblas_option< TransB >::value, m, n, k, alpha, a, lda, b, ldb, beta, c, ldc ); } // // Overloaded function for dispatching to // * CBLAS backend, and // * double value-type. // template< typename Order, typename TransA, typename TransB > inline void gemm( const Order, const TransA, const TransB, const int m, const int n, const int k, const double alpha, const double* a, const int lda, const double* b, const int ldb, const double beta, double* c, const int ldc ) { cblas_dgemm( cblas_option< Order >::value, cblas_option< TransA >::value, cblas_option< TransB >::value, m, n, k, alpha, a, lda, b, ldb, beta, c, ldc ); } // // Overloaded function for dispatching to // * CBLAS backend, and // * complex value-type. // template< typename Order, typename TransA, typename TransB > inline void gemm( const Order, const TransA, const TransB, const int m, const int n, const int k, const std::complex alpha, const std::complex* a, const int lda, const std::complex* b, const int ldb, const std::complex beta, std::complex* c, const int ldc ) { cblas_cgemm( cblas_option< Order >::value, cblas_option< TransA >::value, cblas_option< TransB >::value, m, n, k, &alpha, a, lda, b, ldb, &beta, c, ldc ); } // // Overloaded function for dispatching to // * CBLAS backend, and // * complex value-type. // template< typename Order, typename TransA, typename TransB > inline void gemm( const Order, const TransA, const TransB, const int m, const int n, const int k, const std::complex alpha, const std::complex* a, const int lda, const std::complex* b, const int ldb, const std::complex beta, std::complex* c, const int ldc ) { cblas_zgemm( cblas_option< Order >::value, cblas_option< TransA >::value, cblas_option< TransB >::value, m, n, k, &alpha, a, lda, b, ldb, &beta, c, ldc ); } #elif defined BOOST_NUMERIC_BINDINGS_BLAS_CUBLAS // // Overloaded function for dispatching to // * CUBLAS backend, and // * float value-type. // template< typename Order, typename TransA, typename TransB > inline void gemm( const Order, const TransA, const TransB, const int m, const int n, const int k, const float alpha, const float* a, const int lda, const float* b, const int ldb, const float beta, float* c, const int ldc ) { BOOST_STATIC_ASSERT( (is_same::value) ); cublasSgemm( blas_option< TransA >::value, blas_option< TransB >::value, m, n, k, alpha, a, lda, b, ldb, beta, c, ldc ); } // // Overloaded function for dispatching to // * CUBLAS backend, and // * double value-type. // template< typename Order, typename TransA, typename TransB > inline void gemm( const Order, const TransA, const TransB, const int m, const int n, const int k, const double alpha, const double* a, const int lda, const double* b, const int ldb, const double beta, double* c, const int ldc ) { BOOST_STATIC_ASSERT( (is_same::value) ); cublasDgemm( blas_option< TransA >::value, blas_option< TransB >::value, m, n, k, alpha, a, lda, b, ldb, beta, c, ldc ); } // // Overloaded function for dispatching to // * CUBLAS backend, and // * complex value-type. // template< typename Order, typename TransA, typename TransB > inline void gemm( const Order, const TransA, const TransB, const int m, const int n, const int k, const std::complex alpha, const std::complex* a, const int lda, const std::complex* b, const int ldb, const std::complex beta, std::complex* c, const int ldc ) { BOOST_STATIC_ASSERT( (is_same::value) ); cublasCgemm( blas_option< TransA >::value, blas_option< TransB >::value, m, n, k, alpha, a, lda, b, ldb, beta, c, ldc ); } // // Overloaded function for dispatching to // * CUBLAS backend, and // * complex value-type. // template< typename Order, typename TransA, typename TransB > inline void gemm( const Order, const TransA, const TransB, const int m, const int n, const int k, const std::complex alpha, const std::complex* a, const int lda, const std::complex* b, const int ldb, const std::complex beta, std::complex* c, const int ldc ) { BOOST_STATIC_ASSERT( (is_same::value) ); cublasZgemm( blas_option< TransA >::value, blas_option< TransB >::value, m, n, k, alpha, a, lda, b, ldb, beta, c, ldc ); } #else // // Overloaded function for dispatching to // * netlib-compatible BLAS backend (the default), and // * float value-type. // template< typename Order, typename TransA, typename TransB > inline void gemm( const Order, const TransA, const TransB, const fortran_int_t m, const fortran_int_t n, const fortran_int_t k, const float alpha, const float* a, const fortran_int_t lda, const float* b, const fortran_int_t ldb, const float beta, float* c, const fortran_int_t ldc ) { BOOST_STATIC_ASSERT( (is_same::value) ); BLAS_SGEMM( &blas_option< TransA >::value, &blas_option< TransB >::value, &m, &n, &k, &alpha, a, &lda, b, &ldb, &beta, c, &ldc ); } // // Overloaded function for dispatching to // * netlib-compatible BLAS backend (the default), and // * double value-type. // template< typename Order, typename TransA, typename TransB > inline void gemm( const Order, const TransA, const TransB, const fortran_int_t m, const fortran_int_t n, const fortran_int_t k, const double alpha, const double* a, const fortran_int_t lda, const double* b, const fortran_int_t ldb, const double beta, double* c, const fortran_int_t ldc ) { BOOST_STATIC_ASSERT( (is_same::value) ); BLAS_DGEMM( &blas_option< TransA >::value, &blas_option< TransB >::value, &m, &n, &k, &alpha, a, &lda, b, &ldb, &beta, c, &ldc ); } // // Overloaded function for dispatching to // * netlib-compatible BLAS backend (the default), and // * complex value-type. // template< typename Order, typename TransA, typename TransB > inline void gemm( const Order, const TransA, const TransB, const fortran_int_t m, const fortran_int_t n, const fortran_int_t k, const std::complex alpha, const std::complex* a, const fortran_int_t lda, const std::complex* b, const fortran_int_t ldb, const std::complex beta, std::complex* c, const fortran_int_t ldc ) { BOOST_STATIC_ASSERT( (is_same::value) ); BLAS_CGEMM( &blas_option< TransA >::value, &blas_option< TransB >::value, &m, &n, &k, &alpha, a, &lda, b, &ldb, &beta, c, &ldc ); } // // Overloaded function for dispatching to // * netlib-compatible BLAS backend (the default), and // * complex value-type. // template< typename Order, typename TransA, typename TransB > inline void gemm( const Order, const TransA, const TransB, const fortran_int_t m, const fortran_int_t n, const fortran_int_t k, const std::complex alpha, const std::complex* a, const fortran_int_t lda, const std::complex* b, const fortran_int_t ldb, const std::complex beta, std::complex* c, const fortran_int_t ldc ) { BOOST_STATIC_ASSERT( (is_same::value) ); BLAS_ZGEMM( &blas_option< TransA >::value, &blas_option< TransB >::value, &m, &n, &k, &alpha, a, &lda, b, &ldb, &beta, c, &ldc ); } #endif } // namespace detail // // Value-type based template class. Use this class if you need a type // for dispatching to gemm. // template< typename Value > struct gemm_impl { typedef Value value_type; typedef typename remove_imaginary< Value >::type real_type; typedef void result_type; // // Static member function that // * Deduces the required arguments for dispatching to BLAS, and // * Asserts that most arguments make sense. // template< typename MatrixA, typename MatrixB, typename MatrixC > static result_type invoke( const value_type alpha, const MatrixA& a, const MatrixB& b, const value_type beta, MatrixC& c ) { namespace bindings = ::boost::numeric::bindings; typedef typename result_of::data_order< MatrixC >::type order; typedef typename result_of::trans_tag< MatrixB, order >::type transb; typedef typename result_of::trans_tag< MatrixA, order >::type transa; BOOST_STATIC_ASSERT( (is_same< typename remove_const< typename bindings::value_type< MatrixA >::type >::type, typename remove_const< typename bindings::value_type< MatrixB >::type >::type >::value) ); BOOST_STATIC_ASSERT( (is_same< typename remove_const< typename bindings::value_type< MatrixA >::type >::type, typename remove_const< typename bindings::value_type< MatrixC >::type >::type >::value) ); BOOST_STATIC_ASSERT( (bindings::has_linear_array< MatrixA >::value) ); BOOST_STATIC_ASSERT( (bindings::has_linear_array< MatrixB >::value) ); BOOST_STATIC_ASSERT( (bindings::has_linear_array< MatrixC >::value) ); BOOST_STATIC_ASSERT( (bindings::is_mutable< MatrixC >::value) ); BOOST_ASSERT( bindings::size_minor(a) == 1 || bindings::stride_minor(a) == 1 ); BOOST_ASSERT( bindings::size_minor(b) == 1 || bindings::stride_minor(b) == 1 ); BOOST_ASSERT( bindings::size_minor(c) == 1 || bindings::stride_minor(c) == 1 ); detail::gemm( order(), transa(), transb(), bindings::size_row(c), bindings::size_column(c), bindings::size_column(a), alpha, bindings::begin_value(a), bindings::stride_major(a), bindings::begin_value(b), bindings::stride_major(b), beta, bindings::begin_value(c), bindings::stride_major(c) ); } }; // // Functions for direct use. These functions are overloaded for temporaries, // so that wrapped types can still be passed and used for write-access. Calls // to these functions are passed to the gemm_impl classes. In the // documentation, the const-overloads are collapsed to avoid a large number of // prototypes which are very similar. // // // Overloaded function for gemm. Its overload differs for // template< typename MatrixA, typename MatrixB, typename MatrixC > inline typename gemm_impl< typename bindings::value_type< MatrixA >::type >::result_type gemm( const typename bindings::value_type< MatrixA >::type alpha, const MatrixA& a, const MatrixB& b, const typename bindings::value_type< MatrixA >::type beta, MatrixC& c ) { gemm_impl< typename bindings::value_type< MatrixA >::type >::invoke( alpha, a, b, beta, c ); } } // namespace blas } // namespace bindings } // namespace numeric } // namespace boost #endif