#include <ulmblas/level3/pack/trlpack.h>
#include <ulmblas/auxiliary/memorypool.h>
#include <ulmblas/auxiliary/printmatrix.h>

using namespace ulmBLAS;

// Small driver for trlpack: builds a dim x dim test matrix, prints it,
// runs trlpack on it, and prints the resulting pack buffer.
int main()
{
    static MemoryPool<double> memoryPool;

    const int dim = 10;

    // Source matrix: dim*dim doubles holding 1, 2, ..., dim*dim in
    // consecutive memory locations.
    double *matrix = memoryPool.allocate(dim*dim);
    for (int k=0; k<dim*dim; ++k) {
        matrix[k] = k + 1;
    }

    // Panel height as reported by ugemm_mr<double>().
    const int panelRows  = ugemm_mr<double>();

    // Integer division: this is floor(dim/panelRows) + 1.
    const int panelCount = (dim + panelRows)/panelRows;

    // Destination buffer for the packed data.
    double *packed = memoryPool.allocate(panelCount*panelRows*dim);

    // The trailing (1, dim) arguments are presumably the row and column
    // increments of the matrix -- confirm against printmatrix.h.
    printMatrix(dim, dim, matrix, 1, dim);

    // The 'false' argument is presumably the unit-diagonal flag -- confirm
    // against trlpack.h.
    trlpack(dim, false, matrix, 1, dim, packed);

    // Shows the entire pack buffer as a panelRows x (panelCount*dim) matrix.
    // NOTE(review): this prints every allocated element; confirm whether
    // trlpack initialises all of them.
    printMatrix(panelRows, panelCount*dim, packed, 1, panelRows);

    // NOTE(review): neither block is handed back to memoryPool before
    // returning -- confirm whether the pool reclaims outstanding blocks.
}