TRSM (Triangular Solver)
Single Precision
Double Precision
Complex Single Precision
Complex Double Precision
Raw Results from Benchmarks
$shell> make BLAS_FUNCTIONS=trsm clean
rm -f strsm_openBLAS dtrsm_openBLAS ctrsm_openBLAS ztrsm_openBLAS strsm_BLIS dtrsm_BLIS ctrsm_BLIS ztrsm_BLIS strsm_Eigen dtrsm_Eigen ctrsm_Eigen ztrsm_Eigen strsm_MKL dtrsm_MKL ctrsm_MKL ztrsm_MKL
$shell> make BLAS_FUNCTIONS=trsm
g++-5.3 -DTYPE="float" -DBLAS_LIB=\"openBLAS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o strsm_openBLAS trsm.cc /home/numerik/lehn/work//OpenBLAS-v0.2.15-0/libopenblas_sandybridge-r0.2.15.a
g++-5.3 -DTYPE="double" -DBLAS_LIB=\"openBLAS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o dtrsm_openBLAS trsm.cc /home/numerik/lehn/work//OpenBLAS-v0.2.15-0/libopenblas_sandybridge-r0.2.15.a
g++-5.3 -DTYPE="std::complex<float>" -DBLAS_LIB=\"openBLAS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ctrsm_openBLAS trsm.cc /home/numerik/lehn/work//OpenBLAS-v0.2.15-0/libopenblas_sandybridge-r0.2.15.a
g++-5.3 -DTYPE="std::complex<double>" -DBLAS_LIB=\"openBLAS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ztrsm_openBLAS trsm.cc /home/numerik/lehn/work//OpenBLAS-v0.2.15-0/libopenblas_sandybridge-r0.2.15.a
g++-5.3 -DTYPE="float" -DBLAS_LIB=\"BLIS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o strsm_BLIS trsm.cc /home/numerik/lehn/work//blis/lib/sandybridge/libblis.a -fopenmp
g++-5.3 -DTYPE="double" -DBLAS_LIB=\"BLIS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o dtrsm_BLIS trsm.cc /home/numerik/lehn/work//blis/lib/sandybridge/libblis.a -fopenmp
g++-5.3 -DTYPE="std::complex<float>" -DBLAS_LIB=\"BLIS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ctrsm_BLIS trsm.cc /home/numerik/lehn/work//blis/lib/sandybridge/libblis.a -fopenmp
g++-5.3 -DTYPE="std::complex<double>" -DBLAS_LIB=\"BLIS\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ztrsm_BLIS trsm.cc /home/numerik/lehn/work//blis/lib/sandybridge/libblis.a -fopenmp
g++-5.3 -DTYPE="float" -DBLAS_LIB=\"Eigen\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o strsm_Eigen trsm.cc /home/numerik/lehn/work//EIGEN-3.2.8/blas/libeigen_blas_static.a
g++-5.3 -DTYPE="double" -DBLAS_LIB=\"Eigen\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o dtrsm_Eigen trsm.cc /home/numerik/lehn/work//EIGEN-3.2.8/blas/libeigen_blas_static.a
g++-5.3 -DTYPE="std::complex<float>" -DBLAS_LIB=\"Eigen\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ctrsm_Eigen trsm.cc /home/numerik/lehn/work//EIGEN-3.2.8/blas/libeigen_blas_static.a
g++-5.3 -DTYPE="std::complex<double>" -DBLAS_LIB=\"Eigen\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ztrsm_Eigen trsm.cc /home/numerik/lehn/work//EIGEN-3.2.8/blas/libeigen_blas_static.a
g++-5.3 -DTYPE="float" -DBLAS_LIB=\"MKL\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o strsm_MKL trsm.cc -L /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -Wl,-rpath /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -lmkl_core -lmkl_sequential -lm -lpthread
g++-5.3 -DTYPE="double" -DBLAS_LIB=\"MKL\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o dtrsm_MKL trsm.cc -L /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -Wl,-rpath /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -lmkl_core -lmkl_sequential -lm -lpthread
g++-5.3 -DTYPE="std::complex<float>" -DBLAS_LIB=\"MKL\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ctrsm_MKL trsm.cc -L /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -Wl,-rpath /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -lmkl_core -lmkl_sequential -lm -lpthread
g++-5.3 -DTYPE="std::complex<double>" -DBLAS_LIB=\"MKL\" -DNDEBUG -std=c++11 -O3 -Wall -m64 -march=native -mfpmath=sse -mavx -DUSE_AVX -DHAVE_GCCVEC -I ../../FLENS/ -o ztrsm_MKL trsm.cc -L /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -Wl,-rpath /opt/intel/compilers_and_libraries/linux/mkl/lib/intel64 -lmkl_intel_ilp64 -lmkl_core -lmkl_sequential -lm -lpthread
$shell> ./strsm_MKL > report.strsm_MKL
$shell> ./dtrsm_MKL > report.dtrsm_MKL
$shell> ./ctrsm_MKL > report.ctrsm_MKL
$shell> ./ztrsm_MKL > report.ztrsm_MKL
$shell> ./strsm_Eigen > report.strsm_Eigen
$shell> ./dtrsm_Eigen > report.dtrsm_Eigen
$shell> ./ctrsm_Eigen > report.ctrsm_Eigen
$shell> ./ztrsm_Eigen > report.ztrsm_Eigen
$shell> ./strsm_openBLAS > report.strsm_openBLAS
$shell> ./dtrsm_openBLAS > report.dtrsm_openBLAS
$shell> ./ctrsm_openBLAS > report.ctrsm_openBLAS
$shell> ./ztrsm_openBLAS > report.ztrsm_openBLAS
$shell> ./strsm_BLIS > report.strsm_BLIS
$shell> ./dtrsm_BLIS > report.dtrsm_BLIS
$shell> ./ctrsm_BLIS > report.ctrsm_BLIS
$shell> ./ztrsm_BLIS > report.ztrsm_BLIS
$shell> gnuplot plot.strsm.mflops
$shell> gnuplot plot.dtrsm.mflops
$shell> gnuplot plot.ctrsm.mflops
$shell> gnuplot plot.ztrsm.mflops
$shell>
Single Precision
$shell> cat report.strsm_MKL
# m n k FLENS/ulmBLAS: t MFLOPS MKL: t MFLOPS Residual
50 50 0.0001 1039.99 0.0031 40.57 1.2e-02
100 100 0.0002 4353.45 0.0001 7769.16 6.5e-02
150 150 0.0004 7815.83 0.0004 9334.63 1.8e-01
200 200 0.0008 9899.64 0.0004 17873.10 3.8e-01
250 250 0.0015 10598.20 0.0010 15014.28 6.6e-01
300 300 0.0023 11883.73 0.0019 14192.44 1.0e+00
350 350 0.0015 28977.09 0.0014 30824.90 1.5e+00
400 400 0.0021 31171.84 0.0015 43787.69 2.1e+00
450 450 0.0029 31092.89 0.0024 38519.78 2.9e+00
500 500 0.0039 32313.13 0.0034 36377.79 3.8e+00
550 550 0.0050 33368.19 0.0041 40430.62 3.1e+00
600 600 0.0063 34522.65 0.0048 44930.83 3.7e+00
650 650 0.0080 34218.99 0.0063 43323.80 4.3e+00
700 700 0.0098 35110.37 0.0079 43180.97 5.1e+00
750 750 0.0118 35865.52 0.0099 42715.77 6.0e+00
800 800 0.0139 36784.86 0.0108 47391.69 6.8e+00
850 850 0.0170 36161.23 0.0133 46125.20 7.5e+00
900 900 0.0199 36696.24 0.0159 45766.73 8.5e+00
950 950 0.0231 37153.58 0.0189 45271.28 9.5e+00
1000 1000 0.0266 37656.60 0.0206 48585.50 1.1e+01
1050 1050 0.0311 37164.41 0.0251 46201.82 1.2e+01
1100 1100 0.0354 37568.47 0.0287 46454.91 1.3e+01
1150 1150 0.0401 37926.81 0.0329 46162.56 1.4e+01
1200 1200 0.0449 38477.95 0.0356 48593.62 1.5e+01
1250 1250 0.0515 37935.10 0.0410 47691.62 1.7e+01
1300 1300 0.0575 38184.60 0.0456 48167.46 1.8e+01
1350 1350 0.0640 38446.56 0.0515 47806.23 2.0e+01
1400 1400 0.0704 38961.63 0.0555 49479.63 2.1e+01
1450 1450 0.0788 38669.81 0.0623 48972.57 2.3e+01
1500 1500 0.0865 39000.73 0.0689 48971.50 2.5e+01
1550 1550 0.0951 39153.65 0.0763 48833.90 2.6e+01
1600 1600 0.1032 39679.61 0.0816 50205.25 2.8e+01
1650 1650 0.1145 39237.67 0.0904 49671.81 2.9e+01
1700 1700 0.1247 39389.56 0.0988 49711.47 3.1e+01
1750 1750 0.1353 39610.83 0.1086 49328.59 3.4e+01
1800 1800 0.1466 39788.68 0.1151 50656.29 3.6e+01
1850 1850 0.1605 39456.29 0.1261 50196.75 3.7e+01
1900 1900 0.1722 39823.29 0.1364 50300.80 3.9e+01
1950 1950 0.1859 39886.73 0.1486 49912.98 4.2e+01
2000 2000 0.1990 40195.79 0.1566 51089.42 4.4e+01
$shell> cat report.strsm_Eigen
# m n k FLENS/ulmBLAS: t MFLOPS Eigen: t MFLOPS Residual
50 50 0.0001 1224.23 0.0001 1906.10 3.6e-03
100 100 0.0002 5193.54 0.0002 4450.89 1.7e-02
150 150 0.0004 7919.58 0.0006 6001.64 4.2e-02
200 200 0.0008 10039.32 0.0011 7065.66 8.2e-02
250 250 0.0015 10690.86 0.0021 7457.60 1.4e-01
300 300 0.0023 11976.89 0.0033 8289.77 2.0e-01
350 350 0.0015 29053.89 0.0023 18602.74 2.9e-01
400 400 0.0020 31252.64 0.0032 20063.69 4.0e-01
450 450 0.0034 26863.94 0.0046 20007.09 5.3e-01
500 500 0.0038 32568.25 0.0059 21090.24 6.8e-01
550 550 0.0050 33502.84 0.0080 20833.19 8.4e-01
600 600 0.0063 34556.18 0.0100 21691.79 1.0e+00
650 650 0.0080 34328.63 0.0127 21556.81 1.3e+00
700 700 0.0098 35149.80 0.0153 22414.55 1.5e+00
750 750 0.0118 35878.74 0.0190 22255.00 1.8e+00
800 800 0.0140 36583.69 0.0226 22671.33 2.1e+00
850 850 0.0170 36219.77 0.0272 22594.40 2.4e+00
900 900 0.0198 36733.17 0.0315 23139.69 2.7e+00
950 950 0.0231 37076.48 0.0373 23006.87 3.1e+00
1000 1000 0.0265 37713.13 0.0426 23461.32 3.5e+00
1050 1050 0.0311 37260.07 0.0496 23353.97 4.0e+00
1100 1100 0.0354 37629.44 0.0559 23798.00 4.5e+00
1150 1150 0.0401 37973.69 0.0644 23620.37 5.0e+00
1200 1200 0.0449 38500.75 0.0718 24052.94 5.5e+00
1250 1250 0.0514 37965.54 0.0818 23881.08 6.1e+00
1300 1300 0.0575 38206.82 0.0906 24243.37 6.7e+00
1350 1350 0.0639 38490.63 0.1020 24123.03 7.3e+00
1400 1400 0.0706 38850.52 0.1122 24447.41 8.0e+00
1450 1450 0.0789 38636.78 0.1252 24352.56 8.7e+00
1500 1500 0.0867 38924.05 0.1368 24662.20 9.5e+00
1550 1550 0.0950 39182.16 0.1521 24485.06 1.0e+01
1600 1600 0.1033 39637.56 0.1661 24663.79 1.1e+01
1650 1650 0.1145 39222.55 0.1823 24642.66 1.2e+01
1700 1700 0.1246 39438.08 0.1967 24979.27 1.3e+01
1750 1750 0.1353 39625.23 0.2164 24771.47 1.4e+01
1800 1800 0.1466 39782.52 0.2327 25063.55 1.5e+01
1850 1850 0.1600 39580.61 0.2542 24904.38 1.6e+01
1900 1900 0.1723 39819.72 0.2722 25195.14 1.7e+01
1950 1950 0.1858 39906.37 0.2964 25013.35 1.8e+01
2000 2000 0.1991 40180.78 0.3169 25247.46 1.9e+01
$shell> cat report.strsm_openBLAS
# m n k FLENS/ulmBLAS: t MFLOPS openBLAS: t MFLOPS Residual
50 50 0.0001 1224.23 0.0001 1153.24 4.9e-03
100 100 0.0002 4992.54 0.0003 3603.06 1.9e-02
150 150 0.0004 7786.87 0.0007 4780.89 4.2e-02
200 200 0.0008 10019.12 0.0013 6252.31 8.1e-02
250 250 0.0015 10674.56 0.0022 7121.24 1.3e-01
300 300 0.0010 26759.99 0.0015 18136.69 1.9e-01
350 350 0.0015 28949.82 0.0023 18943.73 2.7e-01
400 400 0.0021 30847.57 0.0030 21554.98 3.7e-01
450 450 0.0030 30757.18 0.0041 22445.52 4.7e-01
500 500 0.0039 32300.31 0.0051 24451.79 5.9e-01
550 550 0.0050 33508.51 0.0066 25106.49 7.4e-01
600 600 0.0063 34475.68 0.0081 26654.84 8.9e-01
650 650 0.0080 34199.94 0.0103 26762.31 1.1e+00
700 700 0.0099 34816.92 0.0122 28085.29 1.3e+00
750 750 0.0118 35815.78 0.0151 28015.13 1.5e+00
800 800 0.0139 36719.28 0.0174 29442.23 1.7e+00
850 850 0.0170 36198.30 0.0206 29830.19 1.9e+00
900 900 0.0198 36792.87 0.0235 31027.71 2.2e+00
950 950 0.0230 37237.65 0.0277 30919.09 2.5e+00
1000 1000 0.0265 37760.18 0.0313 31962.41 2.8e+00
1050 1050 0.0310 37304.01 0.0362 31957.12 3.2e+00
1100 1100 0.0354 37636.58 0.0404 32923.68 3.5e+00
1150 1150 0.0401 37953.58 0.0466 32659.07 3.9e+00
1200 1200 0.0449 38494.89 0.0512 33739.25 4.3e+00
1250 1250 0.0514 37976.41 0.0581 33591.92 4.7e+00
1300 1300 0.0573 38352.66 0.0633 34734.04 5.2e+00
1350 1350 0.0640 38435.62 0.0715 34418.96 5.7e+00
1400 1400 0.0703 39017.92 0.0781 35156.15 6.2e+00
1450 1450 0.0789 38648.38 0.0869 35063.81 6.7e+00
1500 1500 0.0864 39056.17 0.0941 35869.66 7.2e+00
1550 1550 0.0949 39226.50 0.1048 35530.19 7.8e+00
1600 1600 0.1033 39643.18 0.1120 36567.58 8.4e+00
1650 1650 0.1145 39229.39 0.1234 36394.11 9.1e+00
1700 1700 0.1248 39355.12 0.1324 37119.16 9.7e+00
1750 1750 0.1353 39601.20 0.1457 36782.00 1.0e+01
1800 1800 0.1467 39751.73 0.1558 37443.65 1.1e+01
1850 1850 0.1600 39574.13 0.1698 37287.93 1.2e+01
1900 1900 0.1724 39795.63 0.1811 37882.90 1.3e+01
1950 1950 0.1858 39917.67 0.1978 37480.30 1.3e+01
2000 2000 0.1989 40222.01 0.2087 38338.00 1.4e+01
$shell> cat report.strsm_BLIS
# m n k FLENS/ulmBLAS: t MFLOPS BLIS: t MFLOPS Residual
50 50 0.0002 535.55 0.0003 434.95 5.0e-03
100 100 0.0001 7681.61 0.0002 4228.76 1.9e-02
150 150 0.0003 12657.18 0.0005 6904.59 4.5e-02
200 200 0.0006 14385.10 0.0009 9103.43 8.3e-02
250 250 0.0010 16344.79 0.0016 9910.84 1.3e-01
300 300 0.0016 16922.84 0.0024 11266.27 2.0e-01
350 350 0.0012 37215.65 0.0016 26539.38 2.8e-01
400 400 0.0016 39197.07 0.0022 28922.75 3.8e-01
450 450 0.0024 38476.66 0.0031 29301.17 4.8e-01
500 500 0.0032 39437.28 0.0041 30838.79 6.0e-01
550 550 0.0042 39457.62 0.0050 33143.00 7.4e-01
600 600 0.0054 40184.12 0.0064 33958.98 9.1e-01
650 650 0.0070 39246.28 0.0080 34293.58 1.1e+00
700 700 0.0087 39547.09 0.0098 35121.42 1.3e+00
750 750 0.0105 40161.24 0.0115 36573.43 1.5e+00
800 800 0.0125 41017.34 0.0137 37290.62 1.7e+00
850 850 0.0158 38750.41 0.0166 37057.44 2.0e+00
900 900 0.0179 40689.03 0.0192 37922.50 2.2e+00
950 950 0.0209 40939.05 0.0222 38556.74 2.5e+00
1000 1000 0.0242 41345.41 0.0254 39387.83 2.9e+00
1050 1050 0.0282 41087.77 0.0297 38974.78 3.2e+00
1100 1100 0.0328 40579.05 0.0333 39926.24 3.6e+00
1150 1150 0.0366 41552.70 0.0376 40435.03 4.0e+00
1200 1200 0.0421 41085.83 0.0422 40932.15 4.4e+00
1250 1250 0.0471 41446.98 0.0476 41009.92 4.8e+00
1300 1300 0.0532 41294.74 0.0531 41401.80 5.2e+00
1350 1350 0.0589 41801.53 0.0587 41923.65 5.7e+00
1400 1400 0.0649 42267.55 0.0647 42400.93 6.2e+00
1450 1450 0.0732 41655.59 0.0726 41992.28 6.7e+00
1500 1500 0.0805 41940.41 0.0794 42515.99 7.3e+00
1550 1550 0.0889 41905.00 0.0874 42603.62 7.9e+00
1600 1600 0.0960 42675.32 0.0947 43229.57 8.5e+00
1650 1650 0.1073 41846.89 0.1047 42922.75 9.1e+00
1700 1700 0.1172 41935.63 0.1140 43109.56 9.8e+00
1750 1750 0.1280 41862.42 0.1232 43497.38 1.0e+01
1800 1800 0.1389 41996.75 0.1335 43683.60 1.1e+01
1850 1850 0.1516 41763.62 0.1457 43462.88 1.2e+01
1900 1900 0.1629 42108.52 0.1566 43786.20 1.3e+01
1950 1950 0.1763 42047.95 0.1683 44049.94 1.4e+01
2000 2000 0.1887 42388.57 0.1808 44258.18 1.4e+01
$shell>
Double Precision
$shell> cat report.dtrsm_MKL
# m n k FLENS/ulmBLAS: t MFLOPS MKL: t MFLOPS Residual
50 50 0.0001 975.91 0.0021 58.38 2.4e-11
100 100 0.0003 3697.02 0.0001 8103.33 1.3e-10
150 150 0.0007 5093.29 0.0004 8139.67 3.5e-10
200 200 0.0013 6376.58 0.0008 10540.00 7.2e-10
250 250 0.0023 6887.33 0.0016 9593.41 1.2e-09
300 300 0.0016 16932.44 0.0012 21822.18 1.2e-09
350 350 0.0025 17493.28 0.0018 23183.01 1.7e-09
400 400 0.0034 18588.79 0.0028 23138.82 2.3e-09
450 450 0.0049 18680.84 0.0039 23282.60 2.8e-09
500 500 0.0064 19568.82 0.0052 23871.95 3.6e-09
550 550 0.0084 19838.89 0.0072 23262.16 4.3e-09
600 600 0.0106 20408.28 0.0090 24018.31 5.1e-09
650 650 0.0135 20288.32 0.0114 24137.94 6.1e-09
700 700 0.0165 20753.94 0.0142 24114.94 7.0e-09
750 750 0.0203 20753.19 0.0175 24121.71 8.2e-09
800 800 0.0241 21216.22 0.0217 23560.37 9.2e-09
850 850 0.0292 21049.13 0.0258 23841.47 1.0e-08
900 900 0.0341 21384.90 0.0304 24019.11 1.2e-08
950 950 0.0399 21505.20 0.0355 24118.94 1.3e-08
1000 1000 0.0461 21687.99 0.0410 24366.62 1.5e-08
1050 1050 0.0539 21496.82 0.0476 24307.07 1.6e-08
1100 1100 0.0609 21859.38 0.0546 24385.42 1.8e-08
1150 1150 0.0694 21904.55 0.0635 23950.87 2.0e-08
1200 1200 0.0783 22057.06 0.0702 24622.80 2.1e-08
1250 1250 0.0890 21953.20 0.0785 24892.86 2.3e-08
1300 1300 0.0992 22143.19 0.0890 24678.79 2.5e-08
1350 1350 0.1111 22139.52 0.0992 24812.88 2.7e-08
1400 1400 0.1232 22274.68 0.1113 24649.93 2.9e-08
1450 1450 0.1375 22165.91 0.1222 24955.23 3.2e-08
1500 1500 0.1512 22314.25 0.1355 24900.40 3.4e-08
1550 1550 0.1674 22244.49 0.1500 24819.01 3.6e-08
1600 1600 0.1828 22402.99 0.1726 23730.31 3.9e-08
1650 1650 0.2010 22348.67 0.1799 24970.19 4.1e-08
1700 1700 0.2184 22495.73 0.2000 24567.65 4.4e-08
1750 1750 0.2385 22472.43 0.2153 24888.76 4.7e-08
1800 1800 0.2585 22558.83 0.2380 24499.88 5.0e-08
1850 1850 0.2816 22485.51 0.2559 24747.20 5.2e-08
1900 1900 0.3032 22623.46 0.2921 23484.69 5.6e-08
1950 1950 0.3285 22571.13 0.3006 24667.00 5.9e-08
2000 2000 0.3545 22564.67 0.3284 24359.83 6.2e-08
$shell> cat report.dtrsm_Eigen
# m n k FLENS/ulmBLAS: t MFLOPS Eigen: t MFLOPS Residual
50 50 0.0001 1088.70 0.0001 1552.33 1.1e-11
100 100 0.0003 3781.98 0.0003 3167.84 4.7e-11
150 150 0.0007 5122.46 0.0009 3802.44 1.1e-10
200 200 0.0006 14120.88 0.0009 9387.69 2.1e-10
250 250 0.0010 15368.00 0.0016 10051.10 3.5e-10
300 300 0.0016 16997.97 0.0026 10368.27 5.1e-10
350 350 0.0024 17772.83 0.0040 10749.78 7.1e-10
400 400 0.0034 18970.12 0.0059 10880.76 9.6e-10
450 450 0.0048 18924.95 0.0082 11094.69 1.2e-09
500 500 0.0064 19552.77 0.0110 11365.98 1.6e-09
550 550 0.0084 19813.81 0.0146 11392.56 1.9e-09
600 600 0.0106 20338.22 0.0188 11499.33 2.3e-09
650 650 0.0136 20255.62 0.0235 11670.93 2.8e-09
700 700 0.0166 20715.68 0.0290 11844.64 3.3e-09
750 750 0.0202 20922.47 0.0352 11983.35 3.9e-09
800 800 0.0240 21322.42 0.0426 12015.50 4.5e-09
850 850 0.0291 21084.66 0.0507 12113.57 5.1e-09
900 900 0.0341 21408.01 0.0598 12186.92 5.9e-09
950 950 0.0399 21513.04 0.0701 12232.42 6.6e-09
1000 1000 0.0462 21658.62 0.0812 12320.21 7.5e-09
1050 1050 0.0535 21627.38 0.0936 12362.18 8.3e-09
1100 1100 0.0607 21913.75 0.1070 12435.49 9.3e-09
1150 1150 0.0695 21897.78 0.1218 12486.30 1.0e-08
1200 1200 0.0783 22059.27 0.1376 12561.36 1.1e-08
1250 1250 0.0888 21987.39 0.1552 12581.02 1.2e-08
1300 1300 0.0991 22177.30 0.1744 12598.24 1.4e-08
1350 1350 0.1110 22158.97 0.1950 12620.26 1.5e-08
1400 1400 0.1231 22291.93 0.2168 12656.56 1.6e-08
1450 1450 0.1374 22195.69 0.2403 12686.53 1.8e-08
1500 1500 0.1511 22342.79 0.2658 12695.50 1.9e-08
1550 1550 0.1674 22249.63 0.2934 12691.54 2.1e-08
1600 1600 0.1827 22424.81 0.3241 12639.83 2.2e-08
1650 1650 0.2008 22374.39 0.3516 12774.53 2.4e-08
1700 1700 0.2182 22515.21 0.3843 12782.67 2.6e-08
1750 1750 0.2385 22470.64 0.4192 12784.16 2.7e-08
1800 1800 0.2586 22550.25 0.4551 12815.74 2.9e-08
1850 1850 0.2812 22514.31 0.4940 12817.49 3.1e-08
1900 1900 0.3030 22634.55 0.5348 12826.16 3.3e-08
1950 1950 0.3283 22588.96 0.5783 12822.18 3.5e-08
2000 2000 0.3537 22617.46 0.6224 12853.55 3.8e-08
$shell> cat report.dtrsm_openBLAS
# m n k FLENS/ulmBLAS: t MFLOPS openBLAS: t MFLOPS Residual
50 50 0.0001 1102.79 0.0001 1401.58 7.1e-12
100 100 0.0003 3769.03 0.0003 3852.18 2.7e-11
150 150 0.0007 5115.40 0.0006 5255.59 6.0e-11
200 200 0.0013 6390.81 0.0013 6363.47 1.1e-10
250 250 0.0021 7329.57 0.0010 15621.27 1.8e-10
300 300 0.0016 16630.90 0.0015 17648.24 2.7e-10
350 350 0.0024 17824.43 0.0023 18419.68 3.9e-10
400 400 0.0034 18856.52 0.0033 19325.78 5.3e-10
450 450 0.0048 18893.18 0.0046 19664.53 7.0e-10
500 500 0.0064 19518.87 0.0063 19855.82 8.9e-10
550 550 0.0084 19819.58 0.0082 20185.52 1.1e-09
600 600 0.0106 20323.67 0.0105 20661.87 1.4e-09
650 650 0.0136 20207.51 0.0131 21043.78 1.6e-09
700 700 0.0166 20683.23 0.0160 21376.79 1.9e-09
750 750 0.0203 20811.25 0.0195 21603.23 2.3e-09
800 800 0.0241 21229.67 0.0234 21905.57 2.7e-09
850 850 0.0292 21055.33 0.0276 22219.98 3.0e-09
900 900 0.0341 21382.49 0.0323 22547.83 3.5e-09
950 950 0.0399 21502.27 0.0378 22654.52 3.9e-09
1000 1000 0.0461 21700.74 0.0436 22912.15 4.4e-09
1050 1050 0.0536 21591.60 0.0500 23151.50 4.9e-09
1100 1100 0.0609 21847.33 0.0570 23341.70 5.5e-09
1150 1150 0.0695 21894.50 0.0649 23422.03 6.2e-09
1200 1200 0.0784 22042.86 0.0733 23560.21 6.8e-09
1250 1250 0.0890 21953.01 0.0823 23742.38 7.5e-09
1300 1300 0.0992 22136.35 0.0921 23849.65 8.3e-09
1350 1350 0.1112 22120.47 0.1029 23906.07 9.1e-09
1400 1400 0.1233 22256.31 0.1145 23970.56 9.9e-09
1450 1450 0.1376 22149.35 0.1263 24141.64 1.1e-08
1500 1500 0.1510 22345.99 0.1392 24252.14 1.2e-08
1550 1550 0.1674 22239.44 0.1538 24207.08 1.3e-08
1600 1600 0.1829 22398.55 0.1686 24301.15 1.4e-08
1650 1650 0.2011 22341.68 0.1836 24464.18 1.5e-08
1700 1700 0.2185 22487.36 0.2002 24544.29 1.6e-08
1750 1750 0.2388 22445.27 0.2180 24580.00 1.7e-08
1800 1800 0.2586 22550.56 0.2377 24532.36 1.8e-08
1850 1850 0.2817 22477.02 0.2562 24712.74 1.9e-08
1900 1900 0.3030 22639.50 0.2770 24758.46 2.1e-08
1950 1950 0.3290 22534.40 0.2992 24782.83 2.2e-08
2000 2000 0.3539 22605.70 0.3232 24752.33 2.3e-08
$shell> cat report.dtrsm_BLIS
# m n k FLENS/ulmBLAS: t MFLOPS BLIS: t MFLOPS Residual
50 50 0.0002 613.80 0.0003 475.01 7.2e-12
100 100 0.0001 11537.88 0.0002 6324.43 2.9e-11
150 150 0.0002 19716.43 0.0004 9432.99 6.4e-11
200 200 0.0004 22714.37 0.0007 11974.56 1.1e-10
250 250 0.0007 23083.79 0.0012 13121.10 1.8e-10
300 300 0.0011 24571.10 0.0019 14430.28 2.9e-10
350 350 0.0017 25257.49 0.0028 15510.97 4.0e-10
400 400 0.0024 26124.34 0.0039 16464.94 5.5e-10
450 450 0.0037 24851.09 0.0055 16694.78 7.1e-10
500 500 0.0049 25322.20 0.0072 17293.63 9.0e-10
550 550 0.0067 24971.19 0.0093 17937.72 1.1e-09
600 600 0.0086 25192.53 0.0116 18604.51 1.4e-09
650 650 0.0112 24520.09 0.0146 18757.64 1.7e-09
700 700 0.0138 24788.02 0.0177 19328.18 2.0e-09
750 750 0.0167 25305.39 0.0213 19800.48 2.3e-09
800 800 0.0202 25329.57 0.0255 20058.75 2.7e-09
850 850 0.0250 24539.94 0.0305 20124.63 3.1e-09
900 900 0.0293 24840.49 0.0357 20417.06 3.5e-09
950 950 0.0343 24991.58 0.0413 20744.09 4.0e-09
1000 1000 0.0398 25124.99 0.0478 20918.15 4.5e-09
1050 1050 0.0471 24599.51 0.0553 20914.91 5.0e-09
1100 1100 0.0535 24859.49 0.0630 21130.84 5.6e-09
1150 1150 0.0607 25070.80 0.0714 21304.57 6.2e-09
1200 1200 0.0695 24847.49 0.0803 21524.69 6.9e-09
1250 1250 0.0789 24759.12 0.0910 21461.24 7.6e-09
1300 1300 0.0887 24775.59 0.1016 21632.31 8.3e-09
1350 1350 0.0990 24856.99 0.1131 21755.11 9.2e-09
1400 1400 0.1103 24868.24 0.1256 21847.49 1.0e-08
1450 1450 0.1239 24608.77 0.1398 21814.69 1.1e-08
1500 1500 0.1361 24799.21 0.1535 21991.72 1.2e-08
1550 1550 0.1517 24551.20 0.1687 22079.59 1.3e-08
1600 1600 0.1657 24718.34 0.1845 22198.68 1.4e-08
1650 1650 0.1833 24510.48 0.2028 22150.90 1.5e-08
1700 1700 0.1994 24634.52 0.2211 22220.56 1.6e-08
1750 1750 0.2180 24586.84 0.2398 22348.65 1.7e-08
1800 1800 0.2368 24632.76 0.2606 22381.26 1.8e-08
1850 1850 0.2579 24554.29 0.2828 22390.50 1.9e-08
1900 1900 0.2794 24551.58 0.3053 22463.17 2.1e-08
1950 1950 0.3027 24493.56 0.3290 22538.18 2.2e-08
2000 2000 0.3271 24454.91 0.3540 22600.88 2.3e-08
$shell>
Complex Single Precision
$shell> cat report.ctrsm_MKL
# m n k FLENS/ulmBLAS: t MFLOPS MKL: t MFLOPS Residual
50 50 0.0002 593.05 0.0021 59.03 2.9e-02
100 100 0.0005 1840.44 0.0002 4584.88 1.6e-01
150 150 0.0013 2545.17 0.0008 4117.33 4.4e-01
200 200 0.0026 3103.29 0.0014 5638.35 9.2e-01
250 250 0.0022 7181.35 0.0014 11266.38 1.6e+00
300 300 0.0034 7895.47 0.0023 11878.25 1.6e+00
350 350 0.0051 8457.79 0.0037 11734.42 2.2e+00
400 400 0.0071 9024.29 0.0051 12434.21 2.9e+00
450 450 0.0101 8990.43 0.0074 12282.38 3.6e+00
500 500 0.0134 9330.21 0.0099 12646.96 4.6e+00
550 550 0.0174 9554.47 0.0137 12183.95 5.5e+00
600 600 0.0219 9852.68 0.0172 12579.42 6.6e+00
650 650 0.0281 9773.69 0.0221 12410.22 7.8e+00
700 700 0.0344 9975.37 0.0272 12613.09 9.0e+00
750 750 0.0417 10120.40 0.0337 12508.78 1.0e+01
800 800 0.0495 10345.87 0.0397 12892.09 1.2e+01
850 850 0.0599 10245.33 0.0484 12694.55 1.3e+01
900 900 0.0702 10386.22 0.0567 12855.68 1.5e+01
950 950 0.0815 10516.89 0.0666 12870.20 1.7e+01
1000 1000 0.0936 10681.44 0.0766 13057.96 1.9e+01
1050 1050 0.1094 10578.16 0.0903 12813.23 2.1e+01
1100 1100 0.1244 10695.12 0.1030 12925.01 2.3e+01
1150 1150 0.1411 10779.89 0.1182 12866.24 2.5e+01
1200 1200 0.1586 10895.20 0.1328 13013.05 2.7e+01
1250 1250 0.1808 10802.29 0.1507 12958.38 2.9e+01
1300 1300 0.2018 10886.26 0.1683 13052.64 3.2e+01
1350 1350 0.2247 10947.24 0.1890 13016.69 3.4e+01
1400 1400 0.2488 11029.94 0.2093 13109.54 3.7e+01
1450 1450 0.2782 10959.38 0.2333 13066.15 4.0e+01
1500 1500 0.3060 11029.79 0.2569 13138.78 4.3e+01
1550 1550 0.3373 11041.03 0.2869 12980.21 4.6e+01
1600 1600 0.3673 11152.39 0.3133 13072.18 4.9e+01
1650 1650 0.4050 11090.71 0.3444 13043.91 5.2e+01
1700 1700 0.4411 11138.24 0.3758 13074.08 5.5e+01
1750 1750 0.4794 11178.30 0.4109 13043.69 5.9e+01
1800 1800 0.5205 11204.84 0.4451 13103.79 6.2e+01
1850 1850 0.5661 11183.80 0.4842 13076.29 6.6e+01
1900 1900 0.6124 11200.21 0.5232 13109.87 7.0e+01
1950 1950 0.6583 11264.40 0.5667 13084.32 7.3e+01
2000 2000 0.7074 11308.72 0.6090 13135.44 7.7e+01
$shell> cat report.ctrsm_Eigen
# m n k FLENS/ulmBLAS: t MFLOPS Eigen: t MFLOPS Residual
50 50 0.0002 663.63 0.0003 414.60 1.3e-02
100 100 0.0006 1737.69 0.0013 777.38 5.4e-02
150 150 0.0013 2513.01 0.0033 1036.51 1.3e-01
200 200 0.0012 6884.76 0.0029 2759.88 2.3e-01
250 250 0.0022 7230.56 0.0050 3141.41 3.8e-01
300 300 0.0034 7940.39 0.0079 3431.00 5.5e-01
350 350 0.0051 8441.97 0.0116 3700.79 7.6e-01
400 400 0.0071 9010.62 0.0164 3899.83 1.0e+00
450 450 0.0101 8981.02 0.0224 4076.16 1.3e+00
500 500 0.0134 9313.41 0.0294 4244.72 1.6e+00
550 550 0.0174 9543.14 0.0378 4396.17 2.0e+00
600 600 0.0219 9859.02 0.0478 4516.02 2.5e+00
650 650 0.0281 9762.78 0.0592 4635.94 2.9e+00
700 700 0.0345 9943.38 0.0724 4738.96 3.5e+00
750 750 0.0417 10119.16 0.0872 4838.92 4.0e+00
800 800 0.0496 10332.44 0.1041 4917.36 4.7e+00
850 850 0.0600 10236.32 0.1228 5002.59 5.3e+00
900 900 0.0702 10382.57 0.1439 5067.72 6.1e+00
950 950 0.0818 10484.97 0.1669 5138.19 6.9e+00
1000 1000 0.0939 10650.04 0.1926 5193.18 7.7e+00
1050 1050 0.1095 10572.42 0.2203 5254.09 8.6e+00
1100 1100 0.1246 10686.29 0.2510 5302.80 9.6e+00
1150 1150 0.1411 10778.44 0.2839 5356.58 1.1e+01
1200 1200 0.1586 10896.11 0.3199 5400.99 1.2e+01
1250 1250 0.1808 10803.17 0.3587 5444.26 1.3e+01
1300 1300 0.2019 10880.47 0.4008 5481.59 1.4e+01
1350 1350 0.2247 10947.63 0.4460 5516.84 1.5e+01
1400 1400 0.2487 11035.53 0.4940 5554.40 1.7e+01
1450 1450 0.2784 10952.17 0.5454 5589.44 1.8e+01
1500 1500 0.3059 11031.75 0.6008 5617.20 2.0e+01
1550 1550 0.3372 11044.24 0.6594 5647.20 2.1e+01
1600 1600 0.3673 11152.34 0.7225 5669.55 2.3e+01
1650 1650 0.4050 11092.16 0.7880 5700.57 2.4e+01
1700 1700 0.4413 11132.78 0.8583 5723.98 2.6e+01
1750 1750 0.4792 11185.04 0.9330 5743.95 2.8e+01
1800 1800 0.5206 11201.78 1.0105 5771.54 3.0e+01
1850 1850 0.5665 11175.89 1.0961 5776.60 3.2e+01
1900 1900 0.6123 11201.20 1.1826 5799.71 3.4e+01
1950 1950 0.6585 11259.56 1.2752 5814.83 3.6e+01
2000 2000 0.7073 11310.03 1.3715 5833.09 3.8e+01
$shell> cat report.ctrsm_openBLAS
# m n k FLENS/ulmBLAS: t MFLOPS openBLAS: t MFLOPS Residual
50 50 0.0002 709.68 0.0001 876.08 5.7e-03
100 100 0.0005 1829.38 0.0006 1774.74 2.4e-02
150 150 0.0013 2506.62 0.0015 2246.95 5.7e-02
200 200 0.0019 4143.86 0.0013 6059.50 1.1e-01
250 250 0.0022 7247.42 0.0024 6442.84 1.8e-01
300 300 0.0034 7929.64 0.0039 6950.26 2.6e-01
350 350 0.0051 8399.13 0.0059 7275.19 3.8e-01
400 400 0.0072 8884.39 0.0083 7726.26 5.0e-01
450 450 0.0102 8950.10 0.0115 7921.49 6.6e-01
500 500 0.0135 9288.08 0.0155 8057.47 8.4e-01
550 550 0.0175 9508.10 0.0199 8339.74 1.1e+00
600 600 0.0220 9834.25 0.0251 8602.62 1.3e+00
650 650 0.0282 9745.86 0.0310 8855.60 1.6e+00
700 700 0.0345 9947.97 0.0379 9056.13 1.9e+00
750 750 0.0418 10102.35 0.0458 9208.33 2.2e+00
800 800 0.0495 10345.04 0.0533 9599.16 2.6e+00
850 850 0.0601 10217.13 0.0632 9721.67 2.9e+00
900 900 0.0702 10386.18 0.0744 9798.21 3.4e+00
950 950 0.0817 10490.53 0.0868 9877.93 3.8e+00
1000 1000 0.0939 10652.60 0.0996 10042.12 4.3e+00
1050 1050 0.1096 10559.21 0.1144 10121.76 4.9e+00
1100 1100 0.1249 10655.63 0.1304 10203.27 5.4e+00
1150 1150 0.1415 10746.71 0.1480 10278.03 6.1e+00
1200 1200 0.1591 10860.38 0.1658 10422.11 6.7e+00
1250 1250 0.1812 10777.62 0.1852 10545.79 7.4e+00
1300 1300 0.2024 10854.94 0.2083 10547.52 8.2e+00
1350 1350 0.2253 10920.07 0.2321 10601.53 8.9e+00
1400 1400 0.2495 10997.69 0.2557 10733.39 9.8e+00
1450 1450 0.2790 10925.10 0.2825 10793.32 1.1e+01
1500 1500 0.3070 10992.50 0.3122 10809.01 1.1e+01
1550 1550 0.3384 11004.79 0.3439 10828.26 1.2e+01
1600 1600 0.3684 11118.87 0.3741 10947.90 1.3e+01
1650 1650 0.4063 11055.49 0.4074 11025.70 1.4e+01
1700 1700 0.4428 11094.58 0.4451 11039.11 1.6e+01
1750 1750 0.4803 11158.31 0.4840 11073.49 1.7e+01
1800 1800 0.5221 11171.08 0.5223 11166.61 1.8e+01
1850 1850 0.5680 11148.15 0.5670 11166.74 1.9e+01
1900 1900 0.6143 11166.29 0.6145 11161.97 2.0e+01
1950 1950 0.6602 11231.32 0.6630 11184.63 2.2e+01
2000 2000 0.7094 11277.49 0.7096 11274.25 2.3e+01
$shell> cat report.ctrsm_BLIS
# m n k FLENS/ulmBLAS: t MFLOPS BLIS: t MFLOPS Residual
50 50 0.0003 435.90 0.0002 769.82 8.8e-03
100 100 0.0001 7081.40 0.0002 4155.12 3.5e-02
150 150 0.0006 5750.94 0.0009 3632.11 8.6e-02
200 200 0.0008 10324.34 0.0011 7142.32 1.6e-01
250 250 0.0015 10168.08 0.0021 7546.65 2.6e-01
300 300 0.0025 10788.07 0.0032 8321.16 3.9e-01
350 350 0.0041 10535.25 0.0048 8885.77 5.5e-01
400 400 0.0057 11320.99 0.0067 9597.31 7.3e-01
450 450 0.0083 10963.17 0.0095 9603.72 9.5e-01
500 500 0.0111 11216.68 0.0125 10007.45 1.2e+00
550 550 0.0147 11282.18 0.0161 10307.30 1.5e+00
600 600 0.0188 11514.91 0.0204 10563.54 1.8e+00
650 650 0.0245 11201.33 0.0262 10491.07 2.2e+00
700 700 0.0300 11429.30 0.0318 10779.55 2.5e+00
750 750 0.0365 11543.60 0.0384 10984.52 3.0e+00
800 800 0.0435 11771.59 0.0458 11172.11 3.4e+00
850 850 0.0530 11580.80 0.0550 11168.93 3.9e+00
900 900 0.0624 11684.45 0.0644 11314.73 4.4e+00
950 950 0.0727 11790.77 0.0748 11461.88 5.0e+00
1000 1000 0.0840 11910.15 0.0863 11591.18 5.6e+00
1050 1050 0.0983 11772.79 0.1003 11538.62 6.3e+00
1100 1100 0.1120 11879.51 0.1141 11661.53 7.0e+00
1150 1150 0.1273 11950.20 0.1296 11737.58 7.8e+00
1200 1200 0.1437 12024.34 0.1457 11857.26 8.6e+00
1250 1250 0.1644 11881.30 0.1656 11794.96 9.4e+00
1300 1300 0.1845 11908.19 0.1848 11890.29 1.0e+01
1350 1350 0.2068 11897.59 0.2060 11942.56 1.1e+01
1400 1400 0.2292 11973.79 0.2284 12016.10 1.2e+01
1450 1450 0.2572 11853.21 0.2547 11970.57 1.3e+01
1500 1500 0.2836 11899.88 0.2801 12047.74 1.4e+01
1550 1550 0.3125 11918.00 0.3095 12030.68 1.6e+01
1600 1600 0.3412 12003.04 0.3369 12159.13 1.7e+01
1650 1650 0.3776 11896.97 0.3707 12118.04 1.8e+01
1700 1700 0.4117 11934.85 0.4047 12141.26 1.9e+01
1750 1750 0.4473 11982.12 0.4410 12153.21 2.1e+01
1800 1800 0.4877 11959.13 0.4761 12250.05 2.2e+01
1850 1850 0.5307 11931.79 0.5198 12180.14 2.3e+01
1900 1900 0.5748 11933.22 0.5609 12228.05 2.5e+01
1950 1950 0.6186 11986.72 0.6049 12258.53 2.6e+01
2000 2000 0.6665 12003.36 0.6509 12290.52 2.8e+01
$shell>
Complex Double Precision
$shell> cat report.ztrsm_MKL
# m n k FLENS/ulmBLAS: t MFLOPS MKL: t MFLOPS Residual
50 50 0.0002 610.03 0.0021 58.61 5.5e-11
100 100 0.0006 1539.14 0.0004 2503.25 3.1e-10
150 150 0.0019 1766.60 0.0014 2341.00 5.3e-10
200 200 0.0017 4600.71 0.0014 5867.37 9.7e-10
250 250 0.0033 4725.58 0.0026 6126.34 1.5e-09
300 300 0.0053 5057.52 0.0044 6070.24 2.2e-09
350 350 0.0085 5063.84 0.0070 6110.50 2.9e-09
400 400 0.0121 5291.36 0.0104 6128.91 3.9e-09
450 450 0.0174 5244.08 0.0149 6120.53 5.0e-09
500 500 0.0231 5417.16 0.0203 6152.73 6.1e-09
550 550 0.0310 5370.95 0.0272 6125.89 7.3e-09
600 600 0.0393 5493.74 0.0351 6148.72 8.7e-09
650 650 0.0504 5448.28 0.0442 6206.95 1.0e-08
700 700 0.0617 5556.33 0.0551 6227.74 1.2e-08
750 750 0.0761 5543.13 0.0671 6286.01 1.4e-08
800 800 0.0907 5646.11 0.0822 6228.96 1.6e-08
850 850 0.1096 5601.22 0.0980 6267.92 1.8e-08
900 900 0.1282 5684.25 0.1162 6272.92 2.0e-08
950 950 0.1518 5648.57 0.1358 6311.31 2.2e-08
1000 1000 0.1752 5708.27 0.1588 6296.72 2.4e-08
1050 1050 0.2041 5671.46 0.1842 6283.08 2.7e-08
1100 1100 0.2325 5724.45 0.2119 6279.82 3.0e-08
1150 1150 0.2668 5699.66 0.2406 6321.95 3.2e-08
1200 1200 0.3014 5734.00 0.2741 6305.40 3.5e-08
1250 1250 0.3421 5709.34 0.3079 6343.69 3.8e-08
1300 1300 0.3823 5746.42 0.3496 6284.59 4.1e-08
1350 1350 0.4301 5720.09 0.3907 6297.41 4.5e-08
1400 1400 0.4762 5762.61 0.4356 6299.58 4.8e-08
1450 1450 0.5333 5716.16 0.4816 6330.36 5.1e-08
1500 1500 0.5858 5761.57 0.5350 6308.37 5.5e-08
1550 1550 0.6506 5723.57 0.5894 6317.83 5.9e-08
1600 1600 0.7056 5805.18 0.6501 6300.94 6.3e-08
1650 1650 0.7824 5741.20 0.7088 6337.42 6.7e-08
1700 1700 0.8535 5756.47 0.7772 6321.05 7.1e-08
1750 1750 0.9335 5741.28 0.8428 6359.35 7.5e-08
1800 1800 1.0109 5768.83 0.9237 6314.08 8.0e-08
1850 1850 1.0991 5760.57 0.9971 6349.87 8.4e-08
1900 1900 1.1892 5767.55 1.0850 6321.59 8.8e-08
1950 1950 1.2864 5764.19 1.1663 6357.38 9.3e-08
2000 2000 1.3911 5750.77 1.2641 6328.66 9.8e-08
$shell> cat report.ztrsm_Eigen
# m n k FLENS/ulmBLAS: t MFLOPS Eigen: t MFLOPS Residual
50 50 0.0002 650.85 0.0003 400.59 2.9e-11
100 100 0.0006 1547.12 0.0015 652.54 1.2e-10
150 150 0.0019 1773.14 0.0022 1551.77 2.9e-10
200 200 0.0017 4628.23 0.0041 1930.90 5.2e-10
250 250 0.0033 4673.46 0.0074 2105.87 8.2e-10
300 300 0.0053 5074.11 0.0119 2266.13 1.2e-09
350 350 0.0085 5060.54 0.0180 2379.98 1.6e-09
400 400 0.0121 5283.55 0.0263 2435.63 2.1e-09
450 450 0.0174 5246.83 0.0363 2507.22 2.7e-09
500 500 0.0231 5414.99 0.0486 2573.01 3.3e-09
550 550 0.0310 5367.43 0.0630 2639.13 4.0e-09
600 600 0.0393 5498.24 0.0805 2683.03 4.7e-09
650 650 0.0504 5448.63 0.1013 2710.51 5.6e-09
700 700 0.0618 5552.54 0.1246 2753.66 6.5e-09
750 750 0.0761 5540.65 0.1511 2792.07 7.5e-09
800 800 0.0907 5646.20 0.1815 2821.45 8.5e-09
850 850 0.1097 5596.82 0.2152 2854.30 9.6e-09
900 900 0.1284 5679.33 0.2537 2873.79 1.1e-08
950 950 0.1518 5649.51 0.2960 2896.06 1.2e-08
1000 1000 0.1751 5710.50 0.3430 2915.43 1.3e-08
1050 1050 0.2043 5667.34 0.3947 2933.09 1.5e-08
1100 1100 0.2325 5724.76 0.4515 2947.80 1.6e-08
1150 1150 0.2668 5700.91 0.5134 2962.26 1.8e-08
1200 1200 0.3015 5732.18 0.5799 2979.69 1.9e-08
1250 1250 0.3422 5707.21 0.6534 2989.03 2.1e-08
1300 1300 0.3828 5739.83 0.7349 2989.36 2.2e-08
1350 1350 0.4306 5714.12 0.8204 2999.08 2.4e-08
1400 1400 0.4766 5757.84 0.9116 3010.16 2.6e-08
1450 1450 0.5333 5716.02 1.0092 3020.95 2.8e-08
1500 1500 0.5861 5758.70 1.1143 3028.70 3.0e-08
1550 1550 0.6509 5721.14 1.2207 3050.66 3.2e-08
1600 1600 0.7061 5801.24 1.3445 3046.54 3.4e-08
1650 1650 0.7827 5738.97 1.4636 3069.15 3.6e-08
1700 1700 0.8544 5750.23 1.5986 3073.32 3.8e-08
1750 1750 0.9342 5736.87 1.7399 3080.24 4.1e-08
1800 1800 1.0121 5762.43 1.8892 3087.05 4.3e-08
1850 1850 1.1014 5748.91 2.0473 3092.72 4.6e-08
1900 1900 1.1915 5756.68 2.2155 3095.98 4.8e-08
1950 1950 1.2883 5755.77 2.3897 3102.91 5.0e-08
2000 2000 1.3900 5755.27 2.5733 3108.80 5.3e-08
$shell> cat report.ztrsm_openBLAS
# m n k FLENS/ulmBLAS: t MFLOPS openBLAS: t MFLOPS Residual
50 50 0.0002 657.54 0.0002 663.14 1.7e-11
100 100 0.0006 1546.11 0.0009 1078.04 6.8e-11
150 150 0.0019 1768.93 0.0028 1212.28 1.5e-10
200 200 0.0017 4631.79 0.0028 2887.68 2.8e-10
250 250 0.0033 4669.56 0.0051 3077.41 4.5e-10
300 300 0.0053 5074.18 0.0086 3131.32 6.8e-10
350 350 0.0085 5058.41 0.0135 3165.46 9.5e-10
400 400 0.0121 5279.83 0.0202 3167.67 1.3e-09
450 450 0.0175 5213.30 0.0285 3197.81 1.7e-09
500 500 0.0231 5414.07 0.0388 3222.01 2.1e-09
550 550 0.0310 5367.38 0.0513 3244.77 2.6e-09
600 600 0.0393 5501.94 0.0664 3255.29 3.2e-09
650 650 0.0504 5448.19 0.0841 3266.19 3.9e-09
700 700 0.0617 5556.06 0.1044 3285.78 4.6e-09
750 750 0.0758 5562.43 0.1280 3297.14 5.4e-09
800 800 0.0907 5647.28 0.1548 3306.62 6.3e-09
850 850 0.1098 5593.84 0.1851 3317.57 7.3e-09
900 900 0.1283 5684.20 0.2192 3325.41 8.3e-09
950 950 0.1517 5651.34 0.2576 3328.63 9.5e-09
1000 1000 0.1750 5714.03 0.2998 3335.72 1.1e-08
1050 1050 0.2041 5670.51 0.3465 3340.45 1.2e-08
1100 1100 0.2321 5734.50 0.3977 3347.11 1.3e-08
1150 1150 0.2669 5699.11 0.4540 3350.27 1.5e-08
1200 1200 0.3012 5737.43 0.5153 3353.62 1.7e-08
1250 1250 0.3422 5708.18 0.5820 3356.00 1.8e-08
1300 1300 0.3822 5748.69 0.6537 3360.68 2.0e-08
1350 1350 0.4299 5723.47 0.7320 3361.27 2.2e-08
1400 1400 0.4765 5758.62 0.8155 3364.72 2.4e-08
1450 1450 0.5330 5720.00 0.9057 3365.98 2.6e-08
1500 1500 0.5861 5758.57 1.0016 3369.73 2.8e-08
1550 1550 0.6506 5723.82 1.1045 3371.70 3.1e-08
1600 1600 0.7051 5809.48 1.2132 3376.31 3.3e-08
1650 1650 0.7828 5738.89 1.3307 3375.70 3.6e-08
1700 1700 0.8529 5760.25 1.4520 3383.52 3.8e-08
1750 1750 0.9337 5740.10 1.5844 3382.52 4.1e-08
1800 1800 1.0118 5764.03 1.7218 3387.08 4.4e-08
1850 1850 1.0996 5758.37 1.8690 3387.66 4.7e-08
1900 1900 1.1882 5772.58 2.0230 3390.43 5.0e-08
1950 1950 1.2862 5764.78 2.1875 3389.61 5.4e-08
2000 2000 1.3905 5753.51 2.3576 3393.21 5.7e-08
$shell> cat report.ztrsm_BLIS
# m n k FLENS/ulmBLAS: t MFLOPS BLIS: t MFLOPS Residual
50 50 0.0003 425.54 0.0003 411.55 1.2e-11
100 100 0.0004 2628.22 0.0005 2016.70 5.0e-11
150 150 0.0007 4945.28 0.0009 3947.82 1.3e-10
200 200 0.0014 5732.88 0.0018 4550.81 2.5e-10
250 250 0.0028 5626.25 0.0033 4803.81 4.1e-10
300 300 0.0046 5848.82 0.0053 5088.94 6.2e-10
350 350 0.0076 5636.85 0.0082 5235.32 8.9e-10
400 400 0.0109 5881.22 0.0117 5487.98 1.2e-09
450 450 0.0158 5765.38 0.0164 5550.37 1.6e-09
500 500 0.0210 5962.46 0.0219 5712.50 2.0e-09
550 550 0.0287 5793.41 0.0290 5737.99 2.5e-09
600 600 0.0364 5933.06 0.0370 5842.52 3.1e-09
650 650 0.0465 5903.52 0.0467 5882.85 3.7e-09
700 700 0.0571 6003.13 0.0584 5871.68 4.5e-09
750 750 0.0716 5889.71 0.0708 5957.79 5.3e-09
800 800 0.0850 6022.18 0.0850 6021.02 6.2e-09
850 850 0.1031 5955.45 0.1022 6006.54 7.1e-09
900 900 0.1206 6043.33 0.1198 6084.06 8.2e-09
950 950 0.1430 5996.65 0.1411 6076.26 9.3e-09
1000 1000 0.1656 6038.99 0.1636 6112.13 1.0e-08
1050 1050 0.1951 5934.76 0.1897 6102.55 1.2e-08
1100 1100 0.2210 6023.05 0.2168 6140.27 1.3e-08
1150 1150 0.2542 5982.20 0.2480 6131.82 1.5e-08
1200 1200 0.2867 6027.10 0.2803 6164.79 1.6e-08
1250 1250 0.3278 5959.06 0.3170 6161.90 1.8e-08
1300 1300 0.3663 5997.60 0.3549 6189.64 2.0e-08
1350 1350 0.4130 5956.83 0.3986 6173.15 2.2e-08
1400 1400 0.4575 5997.90 0.4419 6210.24 2.4e-08
1450 1450 0.5126 5946.85 0.4927 6187.71 2.6e-08
1500 1500 0.5624 6000.81 0.5429 6216.75 2.8e-08
1550 1550 0.6268 5941.05 0.5997 6209.40 3.0e-08
1600 1600 0.6811 6013.96 0.6560 6243.51 3.3e-08
1650 1650 0.7539 5958.64 0.7216 6225.09 3.5e-08
1700 1700 0.8278 5935.14 0.7867 6244.83 3.8e-08
1750 1750 0.9013 5946.22 0.8593 6236.91 4.1e-08
1800 1800 0.9798 5951.97 0.9319 6258.19 4.4e-08
1850 1850 1.0641 5950.19 1.0137 6246.12 4.7e-08
1900 1900 1.1527 5950.42 1.0965 6255.14 5.0e-08
1950 1950 1.2478 5942.41 1.1867 6248.18 5.3e-08
2000 2000 1.3503 5924.59 1.2788 6255.90 5.6e-08
$shell>