1
       2
       3
       4
       5
       6
       7
       8
       9
      10
      11
      12
      13
      14
      15
      16
      17
      18
      19
      20
      21
      22
      23
      24
      25
      26
      27
      28
      29
      30
      31
      32
      33
      34
      35
      36
      37
      38
      39
      40
      41
      42
      43
      44
      45
      46
      47
      48
      49
      50
      51
      52
      53
      54
      55
      56
      57
      58
      59
      60
      61
      62
      63
      64
      65
      66
      67
      68
      69
      70
      71
      72
      73
      74
      75
      76
      77
      78
      79
      80
      81
      82
      83
      84
      85
      86
      87
      88
      89
      90
      91
      92
      93
      94
      95
      96
      97
      98
      99
     100
     101
     102
     103
     104
     105
     106
     107
     108
     109
     110
     111
     112
     113
     114
     115
     116
     117
     118
     119
     120
     121
     122
     123
     124
     125
/*
 *   Copyright (c) 2010, Michael Lehn
 *
 *   All rights reserved.
 *
 *   Redistribution and use in source and binary forms, with or without
 *   modification, are permitted provided that the following conditions
 *   are met:
 *
 *   1) Redistributions of source code must retain the above copyright
 *      notice, this list of conditions and the following disclaimer.
 *   2) Redistributions in binary form must reproduce the above copyright
 *      notice, this list of conditions and the following disclaimer in
 *      the documentation and/or other materials provided with the
 *      distribution.
 *   3) Neither the name of the FLENS development group nor the names of
 *      its contributors may be used to endorse or promote products derived
 *      from this software without specific prior written permission.
 *
 *   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 *   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 *   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 *   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 *   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 *   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 *   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 *   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 *   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 *   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 *   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#ifndef FLENS_BLAS_LEVEL3_RK_TCC
#define FLENS_BLAS_LEVEL3_RK_TCC

#include <flens/blas/closures/closures.h>
#include <flens/blas/level3/level3.h>
#include <flens/typedefs.h>

namespace flens { namespace blas {

//-- herk
template <typename ALPHA, typename MA, typename BETA, typename MC>
typename RestrictTo<IsGeMatrix<MA>::value
                 && IsHeMatrix<MC>::value,
         void>::Type
rk(Transpose        trans,
   const ALPHA      &alpha,
   const MA         &A,
   const BETA       &beta,
   MC               &&C)
{
    typedef typename RemoveRef<MA>::Type MatrixA;
    typedef typename RemoveRef<MC>::Type MatrixC;

    ASSERT(C.order()==A.order());
    typedef typename MatrixC::IndexType IndexType;

    IndexType n = (trans==NoTrans) ? A.numRows()
                                            : A.numCols();
    IndexType k = (trans==NoTrans) ? A.numCols()
                                            : A.numRows();

    ASSERT((beta==static_cast<BETA>(0)) || (C.dim()==n));
    if (C.dim()!=n) {
        C.resize(n, n);
    }

    ASSERT(C.dim()==((trans==NoTrans) ? A.numRows() : A.numCols()));

#   ifdef HAVE_CXXBLAS_HERK
    cxxblas::herk(C.order(), C.upLo(),
                  trans, n, k, alpha,
                  A.data(), A.leadingDimension(),
                  beta,
                  C.data(), C.leadingDimension());
#   else
    ASSERT(0);
#   endif
}

//-- syrk
template <typename ALPHA, typename MA, typename BETA, typename MC>
typename RestrictTo<IsGeMatrix<MA>::value
                 && IsSyMatrix<MC>::value,
         void>::Type
rk(Transpose trans,
   const ALPHA      &alpha,
   const MA         &A,
   const BETA       &beta,
   MC               &&C)
{
    typedef typename RemoveRef<MA>::Type MatrixA;
    typedef typename RemoveRef<MC>::Type MatrixC;

    ASSERT(C.order()==A.order());

    typedef typename MatrixC::IndexType IndexType;

    IndexType n = (trans==NoTrans) ? A.numRows()
                                            : A.numCols();
    IndexType k = (trans==NoTrans) ? A.numCols()
                                            : A.numRows();

    ASSERT((beta==static_cast<BETA>(0)) || (C.dim()==n));
    if (C.dim()!=n) {
        C.resize(n, n);
    }

    ASSERT(C.dim()==((trans==NoTrans) ? A.numRows() : A.numCols()));

#   ifdef HAVE_CXXBLAS_SYRK
    cxxblas::syrk(C.order(), C.upLo(),
                  trans, n, k, alpha,
                  A.data(), A.leadingDimension(),
                  beta,
                  C.data(), C.leadingDimension());
#   else
    ASSERT(0);
#   endif
}

} } // namespace blas, flens

#endif // FLENS_BLAS_LEVEL3_RK_TCC