Content

TRSM (Triangular Solver)

Single Precision

Double Precision

Complex Single Precision

Complex Double Precision

Raw Results from Benchmarks

$shell> make BLAS_FUNCTIONS=trsm clean
rm -f   strsm_openBLAS dtrsm_openBLAS ctrsm_openBLAS ztrsm_openBLAS  strsm_BLIS dtrsm_BLIS ctrsm_BLIS ztrsm_BLIS  strsm_Eigen dtrsm_Eigen ctrsm_Eigen ztrsm_Eigen  strsm_MKL dtrsm_MKL ctrsm_MKL ztrsm_MKL
$shell> make BLAS_FUNCTIONS=trsm
g++-5.3 -DTYPE="float" -DBLAS_LIB=\"openBLAS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o strsm_openBLAS trsm.cc /home/numerik/lehn/work//OpenBLAS-v0.2.15-0/libopenblas_sandybridge-r0.2.15.a
g++-5.3 -DTYPE="double" -DBLAS_LIB=\"openBLAS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o dtrsm_openBLAS trsm.cc /home/numerik/lehn/work//OpenBLAS-v0.2.15-0/libopenblas_sandybridge-r0.2.15.a
g++-5.3 -DTYPE="std::complex<float>" -DBLAS_LIB=\"openBLAS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ctrsm_openBLAS trsm.cc /home/numerik/lehn/work//OpenBLAS-v0.2.15-0/libopenblas_sandybridge-r0.2.15.a
g++-5.3 -DTYPE="std::complex<double>" -DBLAS_LIB=\"openBLAS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ztrsm_openBLAS trsm.cc /home/numerik/lehn/work//OpenBLAS-v0.2.15-0/libopenblas_sandybridge-r0.2.15.a
g++-5.3 -DTYPE="float" -DBLAS_LIB=\"BLIS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o strsm_BLIS trsm.cc /home/numerik/lehn/work//blis/lib/sandybridge/libblis.a -fopenmp
g++-5.3 -DTYPE="double" -DBLAS_LIB=\"BLIS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o dtrsm_BLIS trsm.cc /home/numerik/lehn/work//blis/lib/sandybridge/libblis.a -fopenmp
g++-5.3 -DTYPE="std::complex<float>" -DBLAS_LIB=\"BLIS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ctrsm_BLIS trsm.cc /home/numerik/lehn/work//blis/lib/sandybridge/libblis.a -fopenmp
g++-5.3 -DTYPE="std::complex<double>" -DBLAS_LIB=\"BLIS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ztrsm_BLIS trsm.cc /home/numerik/lehn/work//blis/lib/sandybridge/libblis.a -fopenmp
g++-5.3 -DTYPE="float" -DBLAS_LIB=\"Eigen\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o strsm_Eigen trsm.cc /home/numerik/lehn/work//EIGEN-3.2.8/blas/libeigen_blas_static.a
g++-5.3 -DTYPE="double" -DBLAS_LIB=\"Eigen\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o dtrsm_Eigen trsm.cc /home/numerik/lehn/work//EIGEN-3.2.8/blas/libeigen_blas_static.a
g++-5.3 -DTYPE="std::complex<float>" -DBLAS_LIB=\"Eigen\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ctrsm_Eigen trsm.cc /home/numerik/lehn/work//EIGEN-3.2.8/blas/libeigen_blas_static.a
g++-5.3 -DTYPE="std::complex<double>" -DBLAS_LIB=\"Eigen\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ztrsm_Eigen trsm.cc /home/numerik/lehn/work//EIGEN-3.2.8/blas/libeigen_blas_static.a
g++-5.3 -DTYPE="float" -DBLAS_LIB=\"MKL\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o strsm_MKL trsm.cc -L /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -Wl,-rpath  /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -lmkl_core -lmkl_sequential -lm -lpthread
g++-5.3 -DTYPE="double" -DBLAS_LIB=\"MKL\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o dtrsm_MKL trsm.cc -L /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -Wl,-rpath  /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -lmkl_core -lmkl_sequential -lm -lpthread
g++-5.3 -DTYPE="std::complex<float>" -DBLAS_LIB=\"MKL\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ctrsm_MKL trsm.cc -L /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -Wl,-rpath  /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -lmkl_core -lmkl_sequential -lm -lpthread
g++-5.3 -DTYPE="std::complex<double>" -DBLAS_LIB=\"MKL\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ztrsm_MKL trsm.cc -L /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -Wl,-rpath  /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -lmkl_core -lmkl_sequential -lm -lpthread
$shell> ./strsm_MKL > report.strsm_MKL
$shell> ./dtrsm_MKL > report.dtrsm_MKL
$shell> ./ctrsm_MKL > report.ctrsm_MKL
$shell> ./ztrsm_MKL > report.ztrsm_MKL
$shell> ./strsm_Eigen > report.strsm_Eigen
$shell> ./dtrsm_Eigen > report.dtrsm_Eigen
$shell> ./ctrsm_Eigen > report.ctrsm_Eigen
$shell> ./ztrsm_Eigen > report.ztrsm_Eigen
$shell> ./strsm_openBLAS > report.strsm_openBLAS
$shell> ./dtrsm_openBLAS > report.dtrsm_openBLAS
$shell> ./ctrsm_openBLAS > report.ctrsm_openBLAS
$shell> ./ztrsm_openBLAS > report.ztrsm_openBLAS
$shell> ./strsm_BLIS > report.strsm_BLIS
$shell> ./dtrsm_BLIS > report.dtrsm_BLIS
$shell> ./ctrsm_BLIS > report.ctrsm_BLIS
$shell> ./ztrsm_BLIS > report.ztrsm_BLIS
$shell> gnuplot plot.strsm.mflops
$shell> gnuplot plot.dtrsm.mflops
$shell> gnuplot plot.ctrsm.mflops
$shell> gnuplot plot.ztrsm.mflops
$shell> 

Single Precision

$shell> cat report.strsm_MKL
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS              MKL: t    MFLOPS  Residual
    50    50               0.0001   1039.99              0.0031     40.57   1.2e-02
   100   100               0.0002   4353.45              0.0001   7769.16   6.5e-02
   150   150               0.0004   7815.83              0.0004   9334.63   1.8e-01
   200   200               0.0008   9899.64              0.0004  17873.10   3.8e-01
   250   250               0.0015  10598.20              0.0010  15014.28   6.6e-01
   300   300               0.0023  11883.73              0.0019  14192.44   1.0e+00
   350   350               0.0015  28977.09              0.0014  30824.90   1.5e+00
   400   400               0.0021  31171.84              0.0015  43787.69   2.1e+00
   450   450               0.0029  31092.89              0.0024  38519.78   2.9e+00
   500   500               0.0039  32313.13              0.0034  36377.79   3.8e+00
   550   550               0.0050  33368.19              0.0041  40430.62   3.1e+00
   600   600               0.0063  34522.65              0.0048  44930.83   3.7e+00
   650   650               0.0080  34218.99              0.0063  43323.80   4.3e+00
   700   700               0.0098  35110.37              0.0079  43180.97   5.1e+00
   750   750               0.0118  35865.52              0.0099  42715.77   6.0e+00
   800   800               0.0139  36784.86              0.0108  47391.69   6.8e+00
   850   850               0.0170  36161.23              0.0133  46125.20   7.5e+00
   900   900               0.0199  36696.24              0.0159  45766.73   8.5e+00
   950   950               0.0231  37153.58              0.0189  45271.28   9.5e+00
  1000  1000               0.0266  37656.60              0.0206  48585.50   1.1e+01
  1050  1050               0.0311  37164.41              0.0251  46201.82   1.2e+01
  1100  1100               0.0354  37568.47              0.0287  46454.91   1.3e+01
  1150  1150               0.0401  37926.81              0.0329  46162.56   1.4e+01
  1200  1200               0.0449  38477.95              0.0356  48593.62   1.5e+01
  1250  1250               0.0515  37935.10              0.0410  47691.62   1.7e+01
  1300  1300               0.0575  38184.60              0.0456  48167.46   1.8e+01
  1350  1350               0.0640  38446.56              0.0515  47806.23   2.0e+01
  1400  1400               0.0704  38961.63              0.0555  49479.63   2.1e+01
  1450  1450               0.0788  38669.81              0.0623  48972.57   2.3e+01
  1500  1500               0.0865  39000.73              0.0689  48971.50   2.5e+01
  1550  1550               0.0951  39153.65              0.0763  48833.90   2.6e+01
  1600  1600               0.1032  39679.61              0.0816  50205.25   2.8e+01
  1650  1650               0.1145  39237.67              0.0904  49671.81   2.9e+01
  1700  1700               0.1247  39389.56              0.0988  49711.47   3.1e+01
  1750  1750               0.1353  39610.83              0.1086  49328.59   3.4e+01
  1800  1800               0.1466  39788.68              0.1151  50656.29   3.6e+01
  1850  1850               0.1605  39456.29              0.1261  50196.75   3.7e+01
  1900  1900               0.1722  39823.29              0.1364  50300.80   3.9e+01
  1950  1950               0.1859  39886.73              0.1486  49912.98   4.2e+01
  2000  2000               0.1990  40195.79              0.1566  51089.42   4.4e+01
$shell> cat report.strsm_Eigen
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS            Eigen: t    MFLOPS  Residual
    50    50               0.0001   1224.23              0.0001   1906.10   3.6e-03
   100   100               0.0002   5193.54              0.0002   4450.89   1.7e-02
   150   150               0.0004   7919.58              0.0006   6001.64   4.2e-02
   200   200               0.0008  10039.32              0.0011   7065.66   8.2e-02
   250   250               0.0015  10690.86              0.0021   7457.60   1.4e-01
   300   300               0.0023  11976.89              0.0033   8289.77   2.0e-01
   350   350               0.0015  29053.89              0.0023  18602.74   2.9e-01
   400   400               0.0020  31252.64              0.0032  20063.69   4.0e-01
   450   450               0.0034  26863.94              0.0046  20007.09   5.3e-01
   500   500               0.0038  32568.25              0.0059  21090.24   6.8e-01
   550   550               0.0050  33502.84              0.0080  20833.19   8.4e-01
   600   600               0.0063  34556.18              0.0100  21691.79   1.0e+00
   650   650               0.0080  34328.63              0.0127  21556.81   1.3e+00
   700   700               0.0098  35149.80              0.0153  22414.55   1.5e+00
   750   750               0.0118  35878.74              0.0190  22255.00   1.8e+00
   800   800               0.0140  36583.69              0.0226  22671.33   2.1e+00
   850   850               0.0170  36219.77              0.0272  22594.40   2.4e+00
   900   900               0.0198  36733.17              0.0315  23139.69   2.7e+00
   950   950               0.0231  37076.48              0.0373  23006.87   3.1e+00
  1000  1000               0.0265  37713.13              0.0426  23461.32   3.5e+00
  1050  1050               0.0311  37260.07              0.0496  23353.97   4.0e+00
  1100  1100               0.0354  37629.44              0.0559  23798.00   4.5e+00
  1150  1150               0.0401  37973.69              0.0644  23620.37   5.0e+00
  1200  1200               0.0449  38500.75              0.0718  24052.94   5.5e+00
  1250  1250               0.0514  37965.54              0.0818  23881.08   6.1e+00
  1300  1300               0.0575  38206.82              0.0906  24243.37   6.7e+00
  1350  1350               0.0639  38490.63              0.1020  24123.03   7.3e+00
  1400  1400               0.0706  38850.52              0.1122  24447.41   8.0e+00
  1450  1450               0.0789  38636.78              0.1252  24352.56   8.7e+00
  1500  1500               0.0867  38924.05              0.1368  24662.20   9.5e+00
  1550  1550               0.0950  39182.16              0.1521  24485.06   1.0e+01
  1600  1600               0.1033  39637.56              0.1661  24663.79   1.1e+01
  1650  1650               0.1145  39222.55              0.1823  24642.66   1.2e+01
  1700  1700               0.1246  39438.08              0.1967  24979.27   1.3e+01
  1750  1750               0.1353  39625.23              0.2164  24771.47   1.4e+01
  1800  1800               0.1466  39782.52              0.2327  25063.55   1.5e+01
  1850  1850               0.1600  39580.61              0.2542  24904.38   1.6e+01
  1900  1900               0.1723  39819.72              0.2722  25195.14   1.7e+01
  1950  1950               0.1858  39906.37              0.2964  25013.35   1.8e+01
  2000  2000               0.1991  40180.78              0.3169  25247.46   1.9e+01
$shell> cat report.strsm_openBLAS
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS         openBLAS: t    MFLOPS  Residual
    50    50               0.0001   1224.23              0.0001   1153.24   4.9e-03
   100   100               0.0002   4992.54              0.0003   3603.06   1.9e-02
   150   150               0.0004   7786.87              0.0007   4780.89   4.2e-02
   200   200               0.0008  10019.12              0.0013   6252.31   8.1e-02
   250   250               0.0015  10674.56              0.0022   7121.24   1.3e-01
   300   300               0.0010  26759.99              0.0015  18136.69   1.9e-01
   350   350               0.0015  28949.82              0.0023  18943.73   2.7e-01
   400   400               0.0021  30847.57              0.0030  21554.98   3.7e-01
   450   450               0.0030  30757.18              0.0041  22445.52   4.7e-01
   500   500               0.0039  32300.31              0.0051  24451.79   5.9e-01
   550   550               0.0050  33508.51              0.0066  25106.49   7.4e-01
   600   600               0.0063  34475.68              0.0081  26654.84   8.9e-01
   650   650               0.0080  34199.94              0.0103  26762.31   1.1e+00
   700   700               0.0099  34816.92              0.0122  28085.29   1.3e+00
   750   750               0.0118  35815.78              0.0151  28015.13   1.5e+00
   800   800               0.0139  36719.28              0.0174  29442.23   1.7e+00
   850   850               0.0170  36198.30              0.0206  29830.19   1.9e+00
   900   900               0.0198  36792.87              0.0235  31027.71   2.2e+00
   950   950               0.0230  37237.65              0.0277  30919.09   2.5e+00
  1000  1000               0.0265  37760.18              0.0313  31962.41   2.8e+00
  1050  1050               0.0310  37304.01              0.0362  31957.12   3.2e+00
  1100  1100               0.0354  37636.58              0.0404  32923.68   3.5e+00
  1150  1150               0.0401  37953.58              0.0466  32659.07   3.9e+00
  1200  1200               0.0449  38494.89              0.0512  33739.25   4.3e+00
  1250  1250               0.0514  37976.41              0.0581  33591.92   4.7e+00
  1300  1300               0.0573  38352.66              0.0633  34734.04   5.2e+00
  1350  1350               0.0640  38435.62              0.0715  34418.96   5.7e+00
  1400  1400               0.0703  39017.92              0.0781  35156.15   6.2e+00
  1450  1450               0.0789  38648.38              0.0869  35063.81   6.7e+00
  1500  1500               0.0864  39056.17              0.0941  35869.66   7.2e+00
  1550  1550               0.0949  39226.50              0.1048  35530.19   7.8e+00
  1600  1600               0.1033  39643.18              0.1120  36567.58   8.4e+00
  1650  1650               0.1145  39229.39              0.1234  36394.11   9.1e+00
  1700  1700               0.1248  39355.12              0.1324  37119.16   9.7e+00
  1750  1750               0.1353  39601.20              0.1457  36782.00   1.0e+01
  1800  1800               0.1467  39751.73              0.1558  37443.65   1.1e+01
  1850  1850               0.1600  39574.13              0.1698  37287.93   1.2e+01
  1900  1900               0.1724  39795.63              0.1811  37882.90   1.3e+01
  1950  1950               0.1858  39917.67              0.1978  37480.30   1.3e+01
  2000  2000               0.1989  40222.01              0.2087  38338.00   1.4e+01
$shell> cat report.strsm_BLIS
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS             BLIS: t    MFLOPS  Residual
    50    50               0.0002    535.55              0.0003    434.95   5.0e-03
   100   100               0.0001   7681.61              0.0002   4228.76   1.9e-02
   150   150               0.0003  12657.18              0.0005   6904.59   4.5e-02
   200   200               0.0006  14385.10              0.0009   9103.43   8.3e-02
   250   250               0.0010  16344.79              0.0016   9910.84   1.3e-01
   300   300               0.0016  16922.84              0.0024  11266.27   2.0e-01
   350   350               0.0012  37215.65              0.0016  26539.38   2.8e-01
   400   400               0.0016  39197.07              0.0022  28922.75   3.8e-01
   450   450               0.0024  38476.66              0.0031  29301.17   4.8e-01
   500   500               0.0032  39437.28              0.0041  30838.79   6.0e-01
   550   550               0.0042  39457.62              0.0050  33143.00   7.4e-01
   600   600               0.0054  40184.12              0.0064  33958.98   9.1e-01
   650   650               0.0070  39246.28              0.0080  34293.58   1.1e+00
   700   700               0.0087  39547.09              0.0098  35121.42   1.3e+00
   750   750               0.0105  40161.24              0.0115  36573.43   1.5e+00
   800   800               0.0125  41017.34              0.0137  37290.62   1.7e+00
   850   850               0.0158  38750.41              0.0166  37057.44   2.0e+00
   900   900               0.0179  40689.03              0.0192  37922.50   2.2e+00
   950   950               0.0209  40939.05              0.0222  38556.74   2.5e+00
  1000  1000               0.0242  41345.41              0.0254  39387.83   2.9e+00
  1050  1050               0.0282  41087.77              0.0297  38974.78   3.2e+00
  1100  1100               0.0328  40579.05              0.0333  39926.24   3.6e+00
  1150  1150               0.0366  41552.70              0.0376  40435.03   4.0e+00
  1200  1200               0.0421  41085.83              0.0422  40932.15   4.4e+00
  1250  1250               0.0471  41446.98              0.0476  41009.92   4.8e+00
  1300  1300               0.0532  41294.74              0.0531  41401.80   5.2e+00
  1350  1350               0.0589  41801.53              0.0587  41923.65   5.7e+00
  1400  1400               0.0649  42267.55              0.0647  42400.93   6.2e+00
  1450  1450               0.0732  41655.59              0.0726  41992.28   6.7e+00
  1500  1500               0.0805  41940.41              0.0794  42515.99   7.3e+00
  1550  1550               0.0889  41905.00              0.0874  42603.62   7.9e+00
  1600  1600               0.0960  42675.32              0.0947  43229.57   8.5e+00
  1650  1650               0.1073  41846.89              0.1047  42922.75   9.1e+00
  1700  1700               0.1172  41935.63              0.1140  43109.56   9.8e+00
  1750  1750               0.1280  41862.42              0.1232  43497.38   1.0e+01
  1800  1800               0.1389  41996.75              0.1335  43683.60   1.1e+01
  1850  1850               0.1516  41763.62              0.1457  43462.88   1.2e+01
  1900  1900               0.1629  42108.52              0.1566  43786.20   1.3e+01
  1950  1950               0.1763  42047.95              0.1683  44049.94   1.4e+01
  2000  2000               0.1887  42388.57              0.1808  44258.18   1.4e+01
$shell> 

Double Precision

$shell> cat report.dtrsm_MKL
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS              MKL: t    MFLOPS  Residual
    50    50               0.0001    975.91              0.0021     58.38   2.4e-11
   100   100               0.0003   3697.02              0.0001   8103.33   1.3e-10
   150   150               0.0007   5093.29              0.0004   8139.67   3.5e-10
   200   200               0.0013   6376.58              0.0008  10540.00   7.2e-10
   250   250               0.0023   6887.33              0.0016   9593.41   1.2e-09
   300   300               0.0016  16932.44              0.0012  21822.18   1.2e-09
   350   350               0.0025  17493.28              0.0018  23183.01   1.7e-09
   400   400               0.0034  18588.79              0.0028  23138.82   2.3e-09
   450   450               0.0049  18680.84              0.0039  23282.60   2.8e-09
   500   500               0.0064  19568.82              0.0052  23871.95   3.6e-09
   550   550               0.0084  19838.89              0.0072  23262.16   4.3e-09
   600   600               0.0106  20408.28              0.0090  24018.31   5.1e-09
   650   650               0.0135  20288.32              0.0114  24137.94   6.1e-09
   700   700               0.0165  20753.94              0.0142  24114.94   7.0e-09
   750   750               0.0203  20753.19              0.0175  24121.71   8.2e-09
   800   800               0.0241  21216.22              0.0217  23560.37   9.2e-09
   850   850               0.0292  21049.13              0.0258  23841.47   1.0e-08
   900   900               0.0341  21384.90              0.0304  24019.11   1.2e-08
   950   950               0.0399  21505.20              0.0355  24118.94   1.3e-08
  1000  1000               0.0461  21687.99              0.0410  24366.62   1.5e-08
  1050  1050               0.0539  21496.82              0.0476  24307.07   1.6e-08
  1100  1100               0.0609  21859.38              0.0546  24385.42   1.8e-08
  1150  1150               0.0694  21904.55              0.0635  23950.87   2.0e-08
  1200  1200               0.0783  22057.06              0.0702  24622.80   2.1e-08
  1250  1250               0.0890  21953.20              0.0785  24892.86   2.3e-08
  1300  1300               0.0992  22143.19              0.0890  24678.79   2.5e-08
  1350  1350               0.1111  22139.52              0.0992  24812.88   2.7e-08
  1400  1400               0.1232  22274.68              0.1113  24649.93   2.9e-08
  1450  1450               0.1375  22165.91              0.1222  24955.23   3.2e-08
  1500  1500               0.1512  22314.25              0.1355  24900.40   3.4e-08
  1550  1550               0.1674  22244.49              0.1500  24819.01   3.6e-08
  1600  1600               0.1828  22402.99              0.1726  23730.31   3.9e-08
  1650  1650               0.2010  22348.67              0.1799  24970.19   4.1e-08
  1700  1700               0.2184  22495.73              0.2000  24567.65   4.4e-08
  1750  1750               0.2385  22472.43              0.2153  24888.76   4.7e-08
  1800  1800               0.2585  22558.83              0.2380  24499.88   5.0e-08
  1850  1850               0.2816  22485.51              0.2559  24747.20   5.2e-08
  1900  1900               0.3032  22623.46              0.2921  23484.69   5.6e-08
  1950  1950               0.3285  22571.13              0.3006  24667.00   5.9e-08
  2000  2000               0.3545  22564.67              0.3284  24359.83   6.2e-08
$shell> cat report.dtrsm_Eigen
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS            Eigen: t    MFLOPS  Residual
    50    50               0.0001   1088.70              0.0001   1552.33   1.1e-11
   100   100               0.0003   3781.98              0.0003   3167.84   4.7e-11
   150   150               0.0007   5122.46              0.0009   3802.44   1.1e-10
   200   200               0.0006  14120.88              0.0009   9387.69   2.1e-10
   250   250               0.0010  15368.00              0.0016  10051.10   3.5e-10
   300   300               0.0016  16997.97              0.0026  10368.27   5.1e-10
   350   350               0.0024  17772.83              0.0040  10749.78   7.1e-10
   400   400               0.0034  18970.12              0.0059  10880.76   9.6e-10
   450   450               0.0048  18924.95              0.0082  11094.69   1.2e-09
   500   500               0.0064  19552.77              0.0110  11365.98   1.6e-09
   550   550               0.0084  19813.81              0.0146  11392.56   1.9e-09
   600   600               0.0106  20338.22              0.0188  11499.33   2.3e-09
   650   650               0.0136  20255.62              0.0235  11670.93   2.8e-09
   700   700               0.0166  20715.68              0.0290  11844.64   3.3e-09
   750   750               0.0202  20922.47              0.0352  11983.35   3.9e-09
   800   800               0.0240  21322.42              0.0426  12015.50   4.5e-09
   850   850               0.0291  21084.66              0.0507  12113.57   5.1e-09
   900   900               0.0341  21408.01              0.0598  12186.92   5.9e-09
   950   950               0.0399  21513.04              0.0701  12232.42   6.6e-09
  1000  1000               0.0462  21658.62              0.0812  12320.21   7.5e-09
  1050  1050               0.0535  21627.38              0.0936  12362.18   8.3e-09
  1100  1100               0.0607  21913.75              0.1070  12435.49   9.3e-09
  1150  1150               0.0695  21897.78              0.1218  12486.30   1.0e-08
  1200  1200               0.0783  22059.27              0.1376  12561.36   1.1e-08
  1250  1250               0.0888  21987.39              0.1552  12581.02   1.2e-08
  1300  1300               0.0991  22177.30              0.1744  12598.24   1.4e-08
  1350  1350               0.1110  22158.97              0.1950  12620.26   1.5e-08
  1400  1400               0.1231  22291.93              0.2168  12656.56   1.6e-08
  1450  1450               0.1374  22195.69              0.2403  12686.53   1.8e-08
  1500  1500               0.1511  22342.79              0.2658  12695.50   1.9e-08
  1550  1550               0.1674  22249.63              0.2934  12691.54   2.1e-08
  1600  1600               0.1827  22424.81              0.3241  12639.83   2.2e-08
  1650  1650               0.2008  22374.39              0.3516  12774.53   2.4e-08
  1700  1700               0.2182  22515.21              0.3843  12782.67   2.6e-08
  1750  1750               0.2385  22470.64              0.4192  12784.16   2.7e-08
  1800  1800               0.2586  22550.25              0.4551  12815.74   2.9e-08
  1850  1850               0.2812  22514.31              0.4940  12817.49   3.1e-08
  1900  1900               0.3030  22634.55              0.5348  12826.16   3.3e-08
  1950  1950               0.3283  22588.96              0.5783  12822.18   3.5e-08
  2000  2000               0.3537  22617.46              0.6224  12853.55   3.8e-08
$shell> cat report.dtrsm_openBLAS
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS         openBLAS: t    MFLOPS  Residual
    50    50               0.0001   1102.79              0.0001   1401.58   7.1e-12
   100   100               0.0003   3769.03              0.0003   3852.18   2.7e-11
   150   150               0.0007   5115.40              0.0006   5255.59   6.0e-11
   200   200               0.0013   6390.81              0.0013   6363.47   1.1e-10
   250   250               0.0021   7329.57              0.0010  15621.27   1.8e-10
   300   300               0.0016  16630.90              0.0015  17648.24   2.7e-10
   350   350               0.0024  17824.43              0.0023  18419.68   3.9e-10
   400   400               0.0034  18856.52              0.0033  19325.78   5.3e-10
   450   450               0.0048  18893.18              0.0046  19664.53   7.0e-10
   500   500               0.0064  19518.87              0.0063  19855.82   8.9e-10
   550   550               0.0084  19819.58              0.0082  20185.52   1.1e-09
   600   600               0.0106  20323.67              0.0105  20661.87   1.4e-09
   650   650               0.0136  20207.51              0.0131  21043.78   1.6e-09
   700   700               0.0166  20683.23              0.0160  21376.79   1.9e-09
   750   750               0.0203  20811.25              0.0195  21603.23   2.3e-09
   800   800               0.0241  21229.67              0.0234  21905.57   2.7e-09
   850   850               0.0292  21055.33              0.0276  22219.98   3.0e-09
   900   900               0.0341  21382.49              0.0323  22547.83   3.5e-09
   950   950               0.0399  21502.27              0.0378  22654.52   3.9e-09
  1000  1000               0.0461  21700.74              0.0436  22912.15   4.4e-09
  1050  1050               0.0536  21591.60              0.0500  23151.50   4.9e-09
  1100  1100               0.0609  21847.33              0.0570  23341.70   5.5e-09
  1150  1150               0.0695  21894.50              0.0649  23422.03   6.2e-09
  1200  1200               0.0784  22042.86              0.0733  23560.21   6.8e-09
  1250  1250               0.0890  21953.01              0.0823  23742.38   7.5e-09
  1300  1300               0.0992  22136.35              0.0921  23849.65   8.3e-09
  1350  1350               0.1112  22120.47              0.1029  23906.07   9.1e-09
  1400  1400               0.1233  22256.31              0.1145  23970.56   9.9e-09
  1450  1450               0.1376  22149.35              0.1263  24141.64   1.1e-08
  1500  1500               0.1510  22345.99              0.1392  24252.14   1.2e-08
  1550  1550               0.1674  22239.44              0.1538  24207.08   1.3e-08
  1600  1600               0.1829  22398.55              0.1686  24301.15   1.4e-08
  1650  1650               0.2011  22341.68              0.1836  24464.18   1.5e-08
  1700  1700               0.2185  22487.36              0.2002  24544.29   1.6e-08
  1750  1750               0.2388  22445.27              0.2180  24580.00   1.7e-08
  1800  1800               0.2586  22550.56              0.2377  24532.36   1.8e-08
  1850  1850               0.2817  22477.02              0.2562  24712.74   1.9e-08
  1900  1900               0.3030  22639.50              0.2770  24758.46   2.1e-08
  1950  1950               0.3290  22534.40              0.2992  24782.83   2.2e-08
  2000  2000               0.3539  22605.70              0.3232  24752.33   2.3e-08
$shell> cat report.dtrsm_BLIS
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS             BLIS: t    MFLOPS  Residual
    50    50               0.0002    613.80              0.0003    475.01   7.2e-12
   100   100               0.0001  11537.88              0.0002   6324.43   2.9e-11
   150   150               0.0002  19716.43              0.0004   9432.99   6.4e-11
   200   200               0.0004  22714.37              0.0007  11974.56   1.1e-10
   250   250               0.0007  23083.79              0.0012  13121.10   1.8e-10
   300   300               0.0011  24571.10              0.0019  14430.28   2.9e-10
   350   350               0.0017  25257.49              0.0028  15510.97   4.0e-10
   400   400               0.0024  26124.34              0.0039  16464.94   5.5e-10
   450   450               0.0037  24851.09              0.0055  16694.78   7.1e-10
   500   500               0.0049  25322.20              0.0072  17293.63   9.0e-10
   550   550               0.0067  24971.19              0.0093  17937.72   1.1e-09
   600   600               0.0086  25192.53              0.0116  18604.51   1.4e-09
   650   650               0.0112  24520.09              0.0146  18757.64   1.7e-09
   700   700               0.0138  24788.02              0.0177  19328.18   2.0e-09
   750   750               0.0167  25305.39              0.0213  19800.48   2.3e-09
   800   800               0.0202  25329.57              0.0255  20058.75   2.7e-09
   850   850               0.0250  24539.94              0.0305  20124.63   3.1e-09
   900   900               0.0293  24840.49              0.0357  20417.06   3.5e-09
   950   950               0.0343  24991.58              0.0413  20744.09   4.0e-09
  1000  1000               0.0398  25124.99              0.0478  20918.15   4.5e-09
  1050  1050               0.0471  24599.51              0.0553  20914.91   5.0e-09
  1100  1100               0.0535  24859.49              0.0630  21130.84   5.6e-09
  1150  1150               0.0607  25070.80              0.0714  21304.57   6.2e-09
  1200  1200               0.0695  24847.49              0.0803  21524.69   6.9e-09
  1250  1250               0.0789  24759.12              0.0910  21461.24   7.6e-09
  1300  1300               0.0887  24775.59              0.1016  21632.31   8.3e-09
  1350  1350               0.0990  24856.99              0.1131  21755.11   9.2e-09
  1400  1400               0.1103  24868.24              0.1256  21847.49   1.0e-08
  1450  1450               0.1239  24608.77              0.1398  21814.69   1.1e-08
  1500  1500               0.1361  24799.21              0.1535  21991.72   1.2e-08
  1550  1550               0.1517  24551.20              0.1687  22079.59   1.3e-08
  1600  1600               0.1657  24718.34              0.1845  22198.68   1.4e-08
  1650  1650               0.1833  24510.48              0.2028  22150.90   1.5e-08
  1700  1700               0.1994  24634.52              0.2211  22220.56   1.6e-08
  1750  1750               0.2180  24586.84              0.2398  22348.65   1.7e-08
  1800  1800               0.2368  24632.76              0.2606  22381.26   1.8e-08
  1850  1850               0.2579  24554.29              0.2828  22390.50   1.9e-08
  1900  1900               0.2794  24551.58              0.3053  22463.17   2.1e-08
  1950  1950               0.3027  24493.56              0.3290  22538.18   2.2e-08
  2000  2000               0.3271  24454.91              0.3540  22600.88   2.3e-08
$shell> 

Complex Single Precision

$shell> cat report.ctrsm_MKL
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS              MKL: t    MFLOPS  Residual
    50    50               0.0002    593.05              0.0021     59.03   2.9e-02
   100   100               0.0005   1840.44              0.0002   4584.88   1.6e-01
   150   150               0.0013   2545.17              0.0008   4117.33   4.4e-01
   200   200               0.0026   3103.29              0.0014   5638.35   9.2e-01
   250   250               0.0022   7181.35              0.0014  11266.38   1.6e+00
   300   300               0.0034   7895.47              0.0023  11878.25   1.6e+00
   350   350               0.0051   8457.79              0.0037  11734.42   2.2e+00
   400   400               0.0071   9024.29              0.0051  12434.21   2.9e+00
   450   450               0.0101   8990.43              0.0074  12282.38   3.6e+00
   500   500               0.0134   9330.21              0.0099  12646.96   4.6e+00
   550   550               0.0174   9554.47              0.0137  12183.95   5.5e+00
   600   600               0.0219   9852.68              0.0172  12579.42   6.6e+00
   650   650               0.0281   9773.69              0.0221  12410.22   7.8e+00
   700   700               0.0344   9975.37              0.0272  12613.09   9.0e+00
   750   750               0.0417  10120.40              0.0337  12508.78   1.0e+01
   800   800               0.0495  10345.87              0.0397  12892.09   1.2e+01
   850   850               0.0599  10245.33              0.0484  12694.55   1.3e+01
   900   900               0.0702  10386.22              0.0567  12855.68   1.5e+01
   950   950               0.0815  10516.89              0.0666  12870.20   1.7e+01
  1000  1000               0.0936  10681.44              0.0766  13057.96   1.9e+01
  1050  1050               0.1094  10578.16              0.0903  12813.23   2.1e+01
  1100  1100               0.1244  10695.12              0.1030  12925.01   2.3e+01
  1150  1150               0.1411  10779.89              0.1182  12866.24   2.5e+01
  1200  1200               0.1586  10895.20              0.1328  13013.05   2.7e+01
  1250  1250               0.1808  10802.29              0.1507  12958.38   2.9e+01
  1300  1300               0.2018  10886.26              0.1683  13052.64   3.2e+01
  1350  1350               0.2247  10947.24              0.1890  13016.69   3.4e+01
  1400  1400               0.2488  11029.94              0.2093  13109.54   3.7e+01
  1450  1450               0.2782  10959.38              0.2333  13066.15   4.0e+01
  1500  1500               0.3060  11029.79              0.2569  13138.78   4.3e+01
  1550  1550               0.3373  11041.03              0.2869  12980.21   4.6e+01
  1600  1600               0.3673  11152.39              0.3133  13072.18   4.9e+01
  1650  1650               0.4050  11090.71              0.3444  13043.91   5.2e+01
  1700  1700               0.4411  11138.24              0.3758  13074.08   5.5e+01
  1750  1750               0.4794  11178.30              0.4109  13043.69   5.9e+01
  1800  1800               0.5205  11204.84              0.4451  13103.79   6.2e+01
  1850  1850               0.5661  11183.80              0.4842  13076.29   6.6e+01
  1900  1900               0.6124  11200.21              0.5232  13109.87   7.0e+01
  1950  1950               0.6583  11264.40              0.5667  13084.32   7.3e+01
  2000  2000               0.7074  11308.72              0.6090  13135.44   7.7e+01
$shell> cat report.ctrsm_Eigen
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS            Eigen: t    MFLOPS  Residual
    50    50               0.0002    663.63              0.0003    414.60   1.3e-02
   100   100               0.0006   1737.69              0.0013    777.38   5.4e-02
   150   150               0.0013   2513.01              0.0033   1036.51   1.3e-01
   200   200               0.0012   6884.76              0.0029   2759.88   2.3e-01
   250   250               0.0022   7230.56              0.0050   3141.41   3.8e-01
   300   300               0.0034   7940.39              0.0079   3431.00   5.5e-01
   350   350               0.0051   8441.97              0.0116   3700.79   7.6e-01
   400   400               0.0071   9010.62              0.0164   3899.83   1.0e+00
   450   450               0.0101   8981.02              0.0224   4076.16   1.3e+00
   500   500               0.0134   9313.41              0.0294   4244.72   1.6e+00
   550   550               0.0174   9543.14              0.0378   4396.17   2.0e+00
   600   600               0.0219   9859.02              0.0478   4516.02   2.5e+00
   650   650               0.0281   9762.78              0.0592   4635.94   2.9e+00
   700   700               0.0345   9943.38              0.0724   4738.96   3.5e+00
   750   750               0.0417  10119.16              0.0872   4838.92   4.0e+00
   800   800               0.0496  10332.44              0.1041   4917.36   4.7e+00
   850   850               0.0600  10236.32              0.1228   5002.59   5.3e+00
   900   900               0.0702  10382.57              0.1439   5067.72   6.1e+00
   950   950               0.0818  10484.97              0.1669   5138.19   6.9e+00
  1000  1000               0.0939  10650.04              0.1926   5193.18   7.7e+00
  1050  1050               0.1095  10572.42              0.2203   5254.09   8.6e+00
  1100  1100               0.1246  10686.29              0.2510   5302.80   9.6e+00
  1150  1150               0.1411  10778.44              0.2839   5356.58   1.1e+01
  1200  1200               0.1586  10896.11              0.3199   5400.99   1.2e+01
  1250  1250               0.1808  10803.17              0.3587   5444.26   1.3e+01
  1300  1300               0.2019  10880.47              0.4008   5481.59   1.4e+01
  1350  1350               0.2247  10947.63              0.4460   5516.84   1.5e+01
  1400  1400               0.2487  11035.53              0.4940   5554.40   1.7e+01
  1450  1450               0.2784  10952.17              0.5454   5589.44   1.8e+01
  1500  1500               0.3059  11031.75              0.6008   5617.20   2.0e+01
  1550  1550               0.3372  11044.24              0.6594   5647.20   2.1e+01
  1600  1600               0.3673  11152.34              0.7225   5669.55   2.3e+01
  1650  1650               0.4050  11092.16              0.7880   5700.57   2.4e+01
  1700  1700               0.4413  11132.78              0.8583   5723.98   2.6e+01
  1750  1750               0.4792  11185.04              0.9330   5743.95   2.8e+01
  1800  1800               0.5206  11201.78              1.0105   5771.54   3.0e+01
  1850  1850               0.5665  11175.89              1.0961   5776.60   3.2e+01
  1900  1900               0.6123  11201.20              1.1826   5799.71   3.4e+01
  1950  1950               0.6585  11259.56              1.2752   5814.83   3.6e+01
  2000  2000               0.7073  11310.03              1.3715   5833.09   3.8e+01
$shell> cat report.ctrsm_openBLAS
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS         openBLAS: t    MFLOPS  Residual
    50    50               0.0002    709.68              0.0001    876.08   5.7e-03
   100   100               0.0005   1829.38              0.0006   1774.74   2.4e-02
   150   150               0.0013   2506.62              0.0015   2246.95   5.7e-02
   200   200               0.0019   4143.86              0.0013   6059.50   1.1e-01
   250   250               0.0022   7247.42              0.0024   6442.84   1.8e-01
   300   300               0.0034   7929.64              0.0039   6950.26   2.6e-01
   350   350               0.0051   8399.13              0.0059   7275.19   3.8e-01
   400   400               0.0072   8884.39              0.0083   7726.26   5.0e-01
   450   450               0.0102   8950.10              0.0115   7921.49   6.6e-01
   500   500               0.0135   9288.08              0.0155   8057.47   8.4e-01
   550   550               0.0175   9508.10              0.0199   8339.74   1.1e+00
   600   600               0.0220   9834.25              0.0251   8602.62   1.3e+00
   650   650               0.0282   9745.86              0.0310   8855.60   1.6e+00
   700   700               0.0345   9947.97              0.0379   9056.13   1.9e+00
   750   750               0.0418  10102.35              0.0458   9208.33   2.2e+00
   800   800               0.0495  10345.04              0.0533   9599.16   2.6e+00
   850   850               0.0601  10217.13              0.0632   9721.67   2.9e+00
   900   900               0.0702  10386.18              0.0744   9798.21   3.4e+00
   950   950               0.0817  10490.53              0.0868   9877.93   3.8e+00
  1000  1000               0.0939  10652.60              0.0996  10042.12   4.3e+00
  1050  1050               0.1096  10559.21              0.1144  10121.76   4.9e+00
  1100  1100               0.1249  10655.63              0.1304  10203.27   5.4e+00
  1150  1150               0.1415  10746.71              0.1480  10278.03   6.1e+00
  1200  1200               0.1591  10860.38              0.1658  10422.11   6.7e+00
  1250  1250               0.1812  10777.62              0.1852  10545.79   7.4e+00
  1300  1300               0.2024  10854.94              0.2083  10547.52   8.2e+00
  1350  1350               0.2253  10920.07              0.2321  10601.53   8.9e+00
  1400  1400               0.2495  10997.69              0.2557  10733.39   9.8e+00
  1450  1450               0.2790  10925.10              0.2825  10793.32   1.1e+01
  1500  1500               0.3070  10992.50              0.3122  10809.01   1.1e+01
  1550  1550               0.3384  11004.79              0.3439  10828.26   1.2e+01
  1600  1600               0.3684  11118.87              0.3741  10947.90   1.3e+01
  1650  1650               0.4063  11055.49              0.4074  11025.70   1.4e+01
  1700  1700               0.4428  11094.58              0.4451  11039.11   1.6e+01
  1750  1750               0.4803  11158.31              0.4840  11073.49   1.7e+01
  1800  1800               0.5221  11171.08              0.5223  11166.61   1.8e+01
  1850  1850               0.5680  11148.15              0.5670  11166.74   1.9e+01
  1900  1900               0.6143  11166.29              0.6145  11161.97   2.0e+01
  1950  1950               0.6602  11231.32              0.6630  11184.63   2.2e+01
  2000  2000               0.7094  11277.49              0.7096  11274.25   2.3e+01
$shell> cat report.ctrsm_BLIS
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS             BLIS: t    MFLOPS  Residual
    50    50               0.0003    435.90              0.0002    769.82   8.8e-03
   100   100               0.0001   7081.40              0.0002   4155.12   3.5e-02
   150   150               0.0006   5750.94              0.0009   3632.11   8.6e-02
   200   200               0.0008  10324.34              0.0011   7142.32   1.6e-01
   250   250               0.0015  10168.08              0.0021   7546.65   2.6e-01
   300   300               0.0025  10788.07              0.0032   8321.16   3.9e-01
   350   350               0.0041  10535.25              0.0048   8885.77   5.5e-01
   400   400               0.0057  11320.99              0.0067   9597.31   7.3e-01
   450   450               0.0083  10963.17              0.0095   9603.72   9.5e-01
   500   500               0.0111  11216.68              0.0125  10007.45   1.2e+00
   550   550               0.0147  11282.18              0.0161  10307.30   1.5e+00
   600   600               0.0188  11514.91              0.0204  10563.54   1.8e+00
   650   650               0.0245  11201.33              0.0262  10491.07   2.2e+00
   700   700               0.0300  11429.30              0.0318  10779.55   2.5e+00
   750   750               0.0365  11543.60              0.0384  10984.52   3.0e+00
   800   800               0.0435  11771.59              0.0458  11172.11   3.4e+00
   850   850               0.0530  11580.80              0.0550  11168.93   3.9e+00
   900   900               0.0624  11684.45              0.0644  11314.73   4.4e+00
   950   950               0.0727  11790.77              0.0748  11461.88   5.0e+00
  1000  1000               0.0840  11910.15              0.0863  11591.18   5.6e+00
  1050  1050               0.0983  11772.79              0.1003  11538.62   6.3e+00
  1100  1100               0.1120  11879.51              0.1141  11661.53   7.0e+00
  1150  1150               0.1273  11950.20              0.1296  11737.58   7.8e+00
  1200  1200               0.1437  12024.34              0.1457  11857.26   8.6e+00
  1250  1250               0.1644  11881.30              0.1656  11794.96   9.4e+00
  1300  1300               0.1845  11908.19              0.1848  11890.29   1.0e+01
  1350  1350               0.2068  11897.59              0.2060  11942.56   1.1e+01
  1400  1400               0.2292  11973.79              0.2284  12016.10   1.2e+01
  1450  1450               0.2572  11853.21              0.2547  11970.57   1.3e+01
  1500  1500               0.2836  11899.88              0.2801  12047.74   1.4e+01
  1550  1550               0.3125  11918.00              0.3095  12030.68   1.6e+01
  1600  1600               0.3412  12003.04              0.3369  12159.13   1.7e+01
  1650  1650               0.3776  11896.97              0.3707  12118.04   1.8e+01
  1700  1700               0.4117  11934.85              0.4047  12141.26   1.9e+01
  1750  1750               0.4473  11982.12              0.4410  12153.21   2.1e+01
  1800  1800               0.4877  11959.13              0.4761  12250.05   2.2e+01
  1850  1850               0.5307  11931.79              0.5198  12180.14   2.3e+01
  1900  1900               0.5748  11933.22              0.5609  12228.05   2.5e+01
  1950  1950               0.6186  11986.72              0.6049  12258.53   2.6e+01
  2000  2000               0.6665  12003.36              0.6509  12290.52   2.8e+01
$shell> 

Complex Double Precision

$shell> cat report.ztrsm_MKL
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS              MKL: t    MFLOPS  Residual
    50    50               0.0002    610.03              0.0021     58.61   5.5e-11
   100   100               0.0006   1539.14              0.0004   2503.25   3.1e-10
   150   150               0.0019   1766.60              0.0014   2341.00   5.3e-10
   200   200               0.0017   4600.71              0.0014   5867.37   9.7e-10
   250   250               0.0033   4725.58              0.0026   6126.34   1.5e-09
   300   300               0.0053   5057.52              0.0044   6070.24   2.2e-09
   350   350               0.0085   5063.84              0.0070   6110.50   2.9e-09
   400   400               0.0121   5291.36              0.0104   6128.91   3.9e-09
   450   450               0.0174   5244.08              0.0149   6120.53   5.0e-09
   500   500               0.0231   5417.16              0.0203   6152.73   6.1e-09
   550   550               0.0310   5370.95              0.0272   6125.89   7.3e-09
   600   600               0.0393   5493.74              0.0351   6148.72   8.7e-09
   650   650               0.0504   5448.28              0.0442   6206.95   1.0e-08
   700   700               0.0617   5556.33              0.0551   6227.74   1.2e-08
   750   750               0.0761   5543.13              0.0671   6286.01   1.4e-08
   800   800               0.0907   5646.11              0.0822   6228.96   1.6e-08
   850   850               0.1096   5601.22              0.0980   6267.92   1.8e-08
   900   900               0.1282   5684.25              0.1162   6272.92   2.0e-08
   950   950               0.1518   5648.57              0.1358   6311.31   2.2e-08
  1000  1000               0.1752   5708.27              0.1588   6296.72   2.4e-08
  1050  1050               0.2041   5671.46              0.1842   6283.08   2.7e-08
  1100  1100               0.2325   5724.45              0.2119   6279.82   3.0e-08
  1150  1150               0.2668   5699.66              0.2406   6321.95   3.2e-08
  1200  1200               0.3014   5734.00              0.2741   6305.40   3.5e-08
  1250  1250               0.3421   5709.34              0.3079   6343.69   3.8e-08
  1300  1300               0.3823   5746.42              0.3496   6284.59   4.1e-08
  1350  1350               0.4301   5720.09              0.3907   6297.41   4.5e-08
  1400  1400               0.4762   5762.61              0.4356   6299.58   4.8e-08
  1450  1450               0.5333   5716.16              0.4816   6330.36   5.1e-08
  1500  1500               0.5858   5761.57              0.5350   6308.37   5.5e-08
  1550  1550               0.6506   5723.57              0.5894   6317.83   5.9e-08
  1600  1600               0.7056   5805.18              0.6501   6300.94   6.3e-08
  1650  1650               0.7824   5741.20              0.7088   6337.42   6.7e-08
  1700  1700               0.8535   5756.47              0.7772   6321.05   7.1e-08
  1750  1750               0.9335   5741.28              0.8428   6359.35   7.5e-08
  1800  1800               1.0109   5768.83              0.9237   6314.08   8.0e-08
  1850  1850               1.0991   5760.57              0.9971   6349.87   8.4e-08
  1900  1900               1.1892   5767.55              1.0850   6321.59   8.8e-08
  1950  1950               1.2864   5764.19              1.1663   6357.38   9.3e-08
  2000  2000               1.3911   5750.77              1.2641   6328.66   9.8e-08
$shell> cat report.ztrsm_Eigen
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS            Eigen: t    MFLOPS  Residual
    50    50               0.0002    650.85              0.0003    400.59   2.9e-11
   100   100               0.0006   1547.12              0.0015    652.54   1.2e-10
   150   150               0.0019   1773.14              0.0022   1551.77   2.9e-10
   200   200               0.0017   4628.23              0.0041   1930.90   5.2e-10
   250   250               0.0033   4673.46              0.0074   2105.87   8.2e-10
   300   300               0.0053   5074.11              0.0119   2266.13   1.2e-09
   350   350               0.0085   5060.54              0.0180   2379.98   1.6e-09
   400   400               0.0121   5283.55              0.0263   2435.63   2.1e-09
   450   450               0.0174   5246.83              0.0363   2507.22   2.7e-09
   500   500               0.0231   5414.99              0.0486   2573.01   3.3e-09
   550   550               0.0310   5367.43              0.0630   2639.13   4.0e-09
   600   600               0.0393   5498.24              0.0805   2683.03   4.7e-09
   650   650               0.0504   5448.63              0.1013   2710.51   5.6e-09
   700   700               0.0618   5552.54              0.1246   2753.66   6.5e-09
   750   750               0.0761   5540.65              0.1511   2792.07   7.5e-09
   800   800               0.0907   5646.20              0.1815   2821.45   8.5e-09
   850   850               0.1097   5596.82              0.2152   2854.30   9.6e-09
   900   900               0.1284   5679.33              0.2537   2873.79   1.1e-08
   950   950               0.1518   5649.51              0.2960   2896.06   1.2e-08
  1000  1000               0.1751   5710.50              0.3430   2915.43   1.3e-08
  1050  1050               0.2043   5667.34              0.3947   2933.09   1.5e-08
  1100  1100               0.2325   5724.76              0.4515   2947.80   1.6e-08
  1150  1150               0.2668   5700.91              0.5134   2962.26   1.8e-08
  1200  1200               0.3015   5732.18              0.5799   2979.69   1.9e-08
  1250  1250               0.3422   5707.21              0.6534   2989.03   2.1e-08
  1300  1300               0.3828   5739.83              0.7349   2989.36   2.2e-08
  1350  1350               0.4306   5714.12              0.8204   2999.08   2.4e-08
  1400  1400               0.4766   5757.84              0.9116   3010.16   2.6e-08
  1450  1450               0.5333   5716.02              1.0092   3020.95   2.8e-08
  1500  1500               0.5861   5758.70              1.1143   3028.70   3.0e-08
  1550  1550               0.6509   5721.14              1.2207   3050.66   3.2e-08
  1600  1600               0.7061   5801.24              1.3445   3046.54   3.4e-08
  1650  1650               0.7827   5738.97              1.4636   3069.15   3.6e-08
  1700  1700               0.8544   5750.23              1.5986   3073.32   3.8e-08
  1750  1750               0.9342   5736.87              1.7399   3080.24   4.1e-08
  1800  1800               1.0121   5762.43              1.8892   3087.05   4.3e-08
  1850  1850               1.1014   5748.91              2.0473   3092.72   4.6e-08
  1900  1900               1.1915   5756.68              2.2155   3095.98   4.8e-08
  1950  1950               1.2883   5755.77              2.3897   3102.91   5.0e-08
  2000  2000               1.3900   5755.27              2.5733   3108.80   5.3e-08
$shell> cat report.ztrsm_openBLAS
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS         openBLAS: t    MFLOPS  Residual
    50    50               0.0002    657.54              0.0002    663.14   1.7e-11
   100   100               0.0006   1546.11              0.0009   1078.04   6.8e-11
   150   150               0.0019   1768.93              0.0028   1212.28   1.5e-10
   200   200               0.0017   4631.79              0.0028   2887.68   2.8e-10
   250   250               0.0033   4669.56              0.0051   3077.41   4.5e-10
   300   300               0.0053   5074.18              0.0086   3131.32   6.8e-10
   350   350               0.0085   5058.41              0.0135   3165.46   9.5e-10
   400   400               0.0121   5279.83              0.0202   3167.67   1.3e-09
   450   450               0.0175   5213.30              0.0285   3197.81   1.7e-09
   500   500               0.0231   5414.07              0.0388   3222.01   2.1e-09
   550   550               0.0310   5367.38              0.0513   3244.77   2.6e-09
   600   600               0.0393   5501.94              0.0664   3255.29   3.2e-09
   650   650               0.0504   5448.19              0.0841   3266.19   3.9e-09
   700   700               0.0617   5556.06              0.1044   3285.78   4.6e-09
   750   750               0.0758   5562.43              0.1280   3297.14   5.4e-09
   800   800               0.0907   5647.28              0.1548   3306.62   6.3e-09
   850   850               0.1098   5593.84              0.1851   3317.57   7.3e-09
   900   900               0.1283   5684.20              0.2192   3325.41   8.3e-09
   950   950               0.1517   5651.34              0.2576   3328.63   9.5e-09
  1000  1000               0.1750   5714.03              0.2998   3335.72   1.1e-08
  1050  1050               0.2041   5670.51              0.3465   3340.45   1.2e-08
  1100  1100               0.2321   5734.50              0.3977   3347.11   1.3e-08
  1150  1150               0.2669   5699.11              0.4540   3350.27   1.5e-08
  1200  1200               0.3012   5737.43              0.5153   3353.62   1.7e-08
  1250  1250               0.3422   5708.18              0.5820   3356.00   1.8e-08
  1300  1300               0.3822   5748.69              0.6537   3360.68   2.0e-08
  1350  1350               0.4299   5723.47              0.7320   3361.27   2.2e-08
  1400  1400               0.4765   5758.62              0.8155   3364.72   2.4e-08
  1450  1450               0.5330   5720.00              0.9057   3365.98   2.6e-08
  1500  1500               0.5861   5758.57              1.0016   3369.73   2.8e-08
  1550  1550               0.6506   5723.82              1.1045   3371.70   3.1e-08
  1600  1600               0.7051   5809.48              1.2132   3376.31   3.3e-08
  1650  1650               0.7828   5738.89              1.3307   3375.70   3.6e-08
  1700  1700               0.8529   5760.25              1.4520   3383.52   3.8e-08
  1750  1750               0.9337   5740.10              1.5844   3382.52   4.1e-08
  1800  1800               1.0118   5764.03              1.7218   3387.08   4.4e-08
  1850  1850               1.0996   5758.37              1.8690   3387.66   4.7e-08
  1900  1900               1.1882   5772.58              2.0230   3390.43   5.0e-08
  1950  1950               1.2862   5764.78              2.1875   3389.61   5.4e-08
  2000  2000               1.3905   5753.51              2.3576   3393.21   5.7e-08
$shell> cat report.ztrsm_BLIS
#    m     n     k     FLENS/ulmBLAS: t    MFLOPS             BLIS: t    MFLOPS  Residual
    50    50               0.0003    425.54              0.0003    411.55   1.2e-11
   100   100               0.0004   2628.22              0.0005   2016.70   5.0e-11
   150   150               0.0007   4945.28              0.0009   3947.82   1.3e-10
   200   200               0.0014   5732.88              0.0018   4550.81   2.5e-10
   250   250               0.0028   5626.25              0.0033   4803.81   4.1e-10
   300   300               0.0046   5848.82              0.0053   5088.94   6.2e-10
   350   350               0.0076   5636.85              0.0082   5235.32   8.9e-10
   400   400               0.0109   5881.22              0.0117   5487.98   1.2e-09
   450   450               0.0158   5765.38              0.0164   5550.37   1.6e-09
   500   500               0.0210   5962.46              0.0219   5712.50   2.0e-09
   550   550               0.0287   5793.41              0.0290   5737.99   2.5e-09
   600   600               0.0364   5933.06              0.0370   5842.52   3.1e-09
   650   650               0.0465   5903.52              0.0467   5882.85   3.7e-09
   700   700               0.0571   6003.13              0.0584   5871.68   4.5e-09
   750   750               0.0716   5889.71              0.0708   5957.79   5.3e-09
   800   800               0.0850   6022.18              0.0850   6021.02   6.2e-09
   850   850               0.1031   5955.45              0.1022   6006.54   7.1e-09
   900   900               0.1206   6043.33              0.1198   6084.06   8.2e-09
   950   950               0.1430   5996.65              0.1411   6076.26   9.3e-09
  1000  1000               0.1656   6038.99              0.1636   6112.13   1.0e-08
  1050  1050               0.1951   5934.76              0.1897   6102.55   1.2e-08
  1100  1100               0.2210   6023.05              0.2168   6140.27   1.3e-08
  1150  1150               0.2542   5982.20              0.2480   6131.82   1.5e-08
  1200  1200               0.2867   6027.10              0.2803   6164.79   1.6e-08
  1250  1250               0.3278   5959.06              0.3170   6161.90   1.8e-08
  1300  1300               0.3663   5997.60              0.3549   6189.64   2.0e-08
  1350  1350               0.4130   5956.83              0.3986   6173.15   2.2e-08
  1400  1400               0.4575   5997.90              0.4419   6210.24   2.4e-08
  1450  1450               0.5126   5946.85              0.4927   6187.71   2.6e-08
  1500  1500               0.5624   6000.81              0.5429   6216.75   2.8e-08
  1550  1550               0.6268   5941.05              0.5997   6209.40   3.0e-08
  1600  1600               0.6811   6013.96              0.6560   6243.51   3.3e-08
  1650  1650               0.7539   5958.64              0.7216   6225.09   3.5e-08
  1700  1700               0.8278   5935.14              0.7867   6244.83   3.8e-08
  1750  1750               0.9013   5946.22              0.8593   6236.91   4.1e-08
  1800  1800               0.9798   5951.97              0.9319   6258.19   4.4e-08
  1850  1850               1.0641   5950.19              1.0137   6246.12   4.7e-08
  1900  1900               1.1527   5950.42              1.0965   6255.14   5.0e-08
  1950  1950               1.2478   5942.41              1.1867   6248.18   5.3e-08
  2000  2000               1.3503   5924.59              1.2788   6255.90   5.6e-08
$shell>