1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129
|
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,512,512,1,512,512,1232.49, 24.072, 108.9,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,512,512,1,512,512,1017.57, 39.7489, 131.9,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,512,512,'(1:0)',512,512,3169.25, 30.9497, 169.4,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,512,512,'(1:0)',512,512,2572.45, 50.2432, 208.7,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,1024,1024,1,1024,1024,3921.63, 38.2972, 273.8,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,1024,1024,1,1024,1024,3275.6, 63.9766, 327.8,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,1024,1024,'(1:0)',1024,1024,8224.76, 40.1599, 522.2,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,1024,1024,'(1:0)',1024,1024,6314.27, 61.6628, 680.2,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,1536,1536,1,1536,1536,5471.66, 35.6228, 662.3,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,1536,1536,1,1536,1536,3892.46, 50.6831, 931,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,1536,1536,'(1:0)',1536,1536,7417.62, 24.1459, 1954.2,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,1536,1536,'(1:0)',1536,1536,7656.62, 49.8478, 1893.2,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,2048,2048,1,2048,2048,7086.24, 34.6008, 1212.2,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,2048,2048,1,2048,2048,5653.88, 55.2136, 1519.3,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,2048,2048,'(1:0)',2048,2048,10280.6, 25.0991, 3342.2,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,2048,2048,'(1:0)',2048,2048,9255.65, 45.1936, 3712.3,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,2560,2560,1,2560,2560,8796.32, 34.3606, 1907.3,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,2560,2560,1,2560,2560,7281.15, 56.884, 2304.2,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,2560,2560,'(1:0)',2560,2560,11973.7, 23.3861, 5604.7,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,2560,2560,'(1:0)',2560,2560,10822.1, 42.2738, 6201.1,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,3072,3072,1,3072,3072,11111.9, 36.1717, 2609,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,3072,3072,1,3072,3072,9341.1, 60.8144, 3103.6,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,3072,3072,'(1:0)',3072,3072,12824.9, 20.8739, 9042.1,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,3072,3072,'(1:0)',3072,3072,13107.1, 42.6665, 8847.4,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,3584,3584,1,3584,3584,12145.9, 33.8893, 3790.3,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,3584,3584,1,3584,3584,11127.8, 62.0969, 4137.1,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,3584,3584,'(1:0)',3584,3584,12690.1, 17.7038, 14511.1,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,3584,3584,'(1:0)',3584,3584,13493, 37.6478, 13647.6,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,4096,4096,1,4096,4096,13550.9, 33.0833, 5071.2,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,4096,4096,1,4096,4096,9813.28, 47.9164, 7002.7,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,4096,4096,'(1:0)',4096,4096,14018.9, 17.1129, 19607.7,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,4096,4096,'(1:0)',4096,4096,14377.1, 35.1002, 19119.2,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,4608,4608,1,4608,4608,14208.2, 30.8338, 6886.5,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,4608,4608,1,4608,4608,10633.9, 46.1541, 9201.2,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,4608,4608,'(1:0)',4608,4608,15010.4, 16.2873, 26073.9,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,4608,4608,'(1:0)',4608,4608,14181, 30.7748, 27598.8,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,5120,5120,1,5120,5120,12314.8, 24.0523, 10898.9,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,5120,5120,1,5120,5120,11276.9, 44.0504, 11902,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,5120,5120,'(1:0)',5120,5120,16143.3, 15.7649, 33256.6,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,5120,5120,'(1:0)',5120,5120,15575, 30.4199, 34470.1,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,5632,5632,1,5632,5632,15249, 27.0757, 11715.1,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,5632,5632,1,5632,5632,12511.6, 44.4306, 14278.2,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,5632,5632,'(1:0)',5632,5632,17252.9, 15.3169, 41417.6,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,5632,5632,'(1:0)',5632,5632,16624.8, 29.5185, 42982.5,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,6144,6144,1,6144,6144,13450.3, 21.8918, 17243.3,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,6144,6144,1,6144,6144,12484.9, 40.6409, 18576.7,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,6144,6144,'(1:0)',6144,6144,17700.4, 14.4046, 52412,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,6144,6144,'(1:0)',6144,6144,17029.6, 27.7174, 54476.5,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,6656,6656,1,6656,6656,15441.9, 23.1999, 19095.9,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,6656,6656,1,6656,6656,13509.1, 40.5924, 21827.9,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,6656,6656,'(1:0)',6656,6656,18207.7, 13.6777, 64780.6,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,6656,6656,'(1:0)',6656,6656,17341.5, 26.0539, 68016.4,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,7168,7168,1,7168,7168,14391.4, 20.0773, 25591.2,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,7168,7168,1,7168,7168,12940.2, 36.1055, 28461.2,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,7168,7168,'(1:0)',7168,7168,18068.9, 12.6039, 81530.8,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,7168,7168,'(1:0)',7168,7168,17300.9, 24.1363, 85150.2,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,7680,7680,1,7680,7680,16124.1, 20.9949, 28093.7,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,7680,7680,1,7680,7680,15176.8, 39.5229, 29847.2,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,7680,7680,'(1:0)',7680,7680,18289.2, 11.907, 99071.4,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,7680,7680,'(1:0)',7680,7680,17520.4, 22.813, 103419,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_r,f32_r,f32_r,f32_r,f32_r,L,L,N,N,8192,8192,1,8192,8192,15440.3, 18.848, 35605.3,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_r,f64_r,f64_r,f64_r,f64_r,L,L,N,N,8192,8192,1,8192,8192,15690.9, 38.3079, 35036.6,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f32_c,f32_c,f32_c,f32_c,f32_c,L,L,N,N,8192,8192,'(1:0)',8192,8192,18517.7, 11.3023, 118752,
function,a_type,b_type,c_type,d_type,compute_type,side,uplo,transA,diag,M,N,alpha,lda,ldb,hipblas-Gflops,hipblas-GB/s,hipblas-us,
trmm,f64_c,f64_c,f64_c,f64_c,f64_c,L,L,N,N,8192,8192,'(1:0)',8192,8192,17758.4, 21.6778, 123830,
|